framework,version,device,op_name,kernel_source,gemm_dtype,m,n,k,latency
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,10240,7.602173868815105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,12288,8.968806966145833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,16384,11.82825927734375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,7168,5.281282043457031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,6144,4.1443028767903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,5120,3.430095926920573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,3584,2.1574666341145834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,3072,1.9201056162516277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,4096,2.4620020548502604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,1536,0.951807975769043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,2048,1.2019371032714843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,2560,1.4895445505777993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,768,0.48711465199788406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,512,0.36416746775309244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,1024,0.6726997375488282
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,256,0.2494453271230062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,128,0.19650559425354003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,64,0.1665023962656657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,32,0.1710762659708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,12288,1.8373984018961589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,16384,2.582497151692708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,10240,1.5512928009033202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,8192,1.2749504089355468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,6144,0.954641087849935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,7168,1.0810036977132162
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,4096,0.6034101486206055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,5120,0.769604237874349
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,3584,0.5342528025309246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,3072,0.4802901268005371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,2560,0.38618453343709314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,2048,0.3239935874938965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,1024,0.17134933471679686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,1536,0.23743146260579429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,512,0.09407146771748862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,768,0.13277866840362548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,256,0.06352320114771524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,128,0.05417066812515259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,64,0.04746880133946736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,32,0.04997119903564453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,16384,65536,11.983770751953125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,16384,1.9775488535563153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,12288,1.406329600016276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,10240,1.2068864186604817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,8192,0.9668597539265951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,7168,0.8695807774861655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,6144,0.6980266571044922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,4096,0.4713461240132649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,5120,0.6126581192016601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,3584,0.4197717348734538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,3072,0.3623242696126302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,2048,0.24821759859720866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,2560,0.30016854604085286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,1024,0.12772586345672607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,1536,0.18879253069559734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,768,0.09919359683990478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,512,0.07417279879252116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,256,0.0507914662361145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,128,0.04198400179545085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,64,0.03979946772257487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,32,0.04225706656773885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,12288,65536,8.783329264322917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,12288,1.109675725301107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,16384,1.5959050496419271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,8192,0.8295071919759115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,10240,0.9662805557250976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,6144,0.5916671752929688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,7168,0.7079253514607747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,4096,0.4015551884969075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,5120,0.4907349268595378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,3072,0.28958721160888673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,3584,0.3507189432779948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,2048,0.2049013296763102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,2560,0.2430954615275065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,1024,0.10397013028462727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,1536,0.15660266876220702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,768,0.08106559912363688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,512,0.061953067779541016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,256,0.04130133390426636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,128,0.034474666913350424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,64,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,32,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,10240,65536,7.377752685546875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,16384,1.2410549163818358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,12288,0.9038165410359701
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,65536,8192,5.864042663574219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,8192,0.6368938446044922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,10240,0.8057514826456705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,7168,0.5557589213053385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,5120,0.40038401285807296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,6144,0.4660223960876465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,4096,0.3115008036295573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,3072,0.23866027196248374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,3584,0.2828960100809733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,1536,0.12704319953918458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,2048,0.16240639686584474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,2560,0.20032854080200196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,768,0.06761813163757324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,1024,0.08823466300964355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,512,0.04973119894663493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,256,0.034883201122283936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,128,0.029832533995310467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,64,0.02525866627693176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,32,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,12288,0.8003583908081054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,8192,65536,5.783416748046875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,16384,1.0527061462402343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,8192,0.5408085505167644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,10240,0.6919167836507161
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,7168,0.4791978518168132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,6144,0.4080992062886556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,5120,0.3440309206644694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,4096,0.2759338696797689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,3584,0.23749972979227701
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,3072,0.20831467310587565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,2560,0.1751039981842041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,1536,0.10850986639658611
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,1024,0.07533120314280192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,2048,0.13892265955607097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,256,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,768,0.05894720156987508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,512,0.043620268503824874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,128,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,64,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,32,0.0228000005086263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,12288,0.7258143742879232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,16384,0.92313601175944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,7168,65536,4.991934712727865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,10240,0.6161408106486003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,8192,0.4809045473734538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,7168,0.43683840433756516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,4096,0.24712427457173666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,5120,0.30173867543538413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,6144,0.358297602335612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,3072,0.1813162644704183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,3584,0.21691733996073403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,2560,0.15223573048909506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,1536,0.09598293304443359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,2048,0.12189013163248699
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,1024,0.0648202657699585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,512,0.037137067317962645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,768,0.05181440114974976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,256,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,128,0.023735467592875162
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,64,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,32,0.020537600914637247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,12288,0.6140949249267578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,16384,0.834012794494629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,6144,65536,4.159593709309896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,7168,0.3497642517089844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,8192,0.4201130549112956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,10240,0.5135711987813314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,4096,0.20333226521809897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,6144,0.3055616060892741
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,5120,0.2596170743306478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,2560,0.13025386333465577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,3072,0.14888960520426434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,3584,0.17762986818949383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,1536,0.07662933667500814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,2048,0.1047210693359375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,1024,0.05403199990590414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,768,0.041368532180786136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,512,0.030855466922124226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,256,0.02292693257331848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,128,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,64,0.01972800095876058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,32,0.02053546706835429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,12288,0.537121073404948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,16384,0.6584320068359375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,5120,65536,3.4263425191243493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,7168,0.28344106674194336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,10240,0.40741545359293624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,8192,0.33481388092041015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,4096,0.16486293474833172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,5120,0.1999872048695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,6144,0.23995626767476402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,3584,0.14472746849060059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,2560,0.10239893595377605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,3072,0.12168533007303875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,1536,0.06365866661071777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,2048,0.08536746501922607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,1024,0.04389546712239583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,768,0.03420159816741943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,512,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,256,0.018895999590555827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,128,0.016064000129699708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,64,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,32,0.01650879979133606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,12288,0.40973653793334963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,16384,0.5391701380411784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,4096,65536,2.650251770019531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,7168,0.24453120231628417
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,10240,0.3532458623250326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,8192,0.2907456080118815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,4096,0.14363412857055663
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,6144,0.20824747085571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,5120,0.17578667004903156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,3584,0.1263967990875244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,3072,0.10451626777648926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,2560,0.08976960182189941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,1536,0.054647465546925865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,1024,0.038780800501505536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,2048,0.07550293604532878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,768,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,256,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,512,0.02169813315073649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,128,0.015476266543070475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,64,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,32,0.013058132926623025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,12288,0.36655893325805666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,16384,0.48827733993530276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3584,65536,2.2304779052734376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,7168,0.2214911937713623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,10240,0.32522239685058596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,8192,0.2623487949371338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,4096,0.12933119932810466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,5120,0.15830933252970378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,6144,0.18920106887817384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,3584,0.11376533508300782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,2560,0.08072640101114908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,3072,0.09625706672668458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,1536,0.04939093192418416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,2048,0.06727999846140544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,1024,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,768,0.02648640076319377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,512,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,256,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,128,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,64,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,32,0.012717866897583007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,12288,0.3062442779541016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,16384,0.4141397476196289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,3072,65536,1.9159381866455079
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,7168,0.18817706108093263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,10240,0.27340799967447915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,8192,0.2193749268849691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,4096,0.11284480094909669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,6144,0.1600170612335205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,5120,0.13742079734802246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,3584,0.09932800134023032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,3072,0.08325119813283285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,2560,0.07157866954803467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,1536,0.04355413516362508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,1024,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,2048,0.05935786565144857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,768,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,256,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,512,0.01773653427759806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,128,0.011619200309117634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,64,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,32,0.009955199559529622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,12288,0.24569066365559897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,16384,0.33303893407185875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2560,65536,1.6545813242594403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,7168,0.15503360430399576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,10240,0.21957972844441734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,8192,0.17967999776204427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,4096,0.08843839963277181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,5120,0.10881706873575847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,6144,0.13206186294555664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,3584,0.07826773325602213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,2560,0.05481813351313273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,3072,0.06567253271738688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,1536,0.03290346662203471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,2048,0.04478293259938558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,1024,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,768,0.018549333016077675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,512,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,256,0.011526399850845337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,128,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,64,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,32,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,12288,0.19131733576456705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,2048,65536,1.2360032399495444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,10240,0.16513706843058268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,8192,0.130457599957784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,6144,0.09717760086059571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,7168,0.11755626996358234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,5120,0.08106986681620279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,4096,0.06594560146331788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,3584,0.05638826688130697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,3072,0.04966400067011516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,2560,0.040617601076761885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,2048,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,1536,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,1024,0.018692266941070557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,768,0.015683199961980185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,512,0.013401599725087485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,256,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,128,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,64,0.00951039989789327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,32,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,65536,0.9672373453776041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,12288,0.12563947041829426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,16384,0.16704853375752765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,8192,0.08765546480814615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,10240,0.10891839663187664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,6144,0.06666346788406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,7168,0.07693653106689453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,5120,0.05591359933217367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,4096,0.04403306643168132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,3584,0.039389868577321366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,3072,0.03345066706339518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,2560,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,2048,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,1536,0.01895786722501119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,1024,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,768,0.012060800194740295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,512,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,256,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,128,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,64,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,65536,0.6222848256429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1024,32,0.006201600035031637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,12288,0.09755199750264486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,16384,0.1269429365793864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,10240,0.08946346441904704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,8192,0.07075733343760172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,6144,0.05324906508127848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,7168,0.06311253309249878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,5120,0.04478293259938558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,4096,0.0362496018409729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,3584,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,3072,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,2560,0.023414399226506552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,2048,0.01964799960454305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,1536,0.015270400047302245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,1024,0.01162453293800354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,768,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,256,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,128,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,64,0.0062613333264986675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,32,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,768,65536,0.4944213231404622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,12288,0.07014400164286295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,16384,0.09171626567840577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,10240,0.05877866744995117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,8192,0.04720640182495117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,7168,0.04205226500829061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,6144,0.0359775980313619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,5120,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,4096,0.023347200949986775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,3584,0.021436800559361778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,3072,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,2560,0.016703999042510985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,2048,0.01362986663977305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,1536,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,1024,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,768,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,512,0.0066442668437957765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,256,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,128,0.005160533388455709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,64,0.004996266464392344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,32,0.0054954667886098225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,512,65536,0.34457600911458336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,12288,0.043828264872233076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,16384,0.05867626667022705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,1536,16384,0.25886720021565757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,10240,0.03822933435440064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,8192,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,7168,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,6144,0.022326399882634483
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,5120,0.01691626707712809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,4096,0.01411626636981964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,3584,0.012810666362444559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,3072,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,2560,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,2048,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,1024,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,1536,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,768,0.005851733187834421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,512,0.005037866532802582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,256,0.004542933404445648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,128,0.004373333354791006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,64,0.004026666780312856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,32,0.004382933179537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,256,65536,0.2139125347137451
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,16384,0.04747946659723918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,8192,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,7168,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,10240,0.030242133140563964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,6144,0.015406933426856995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,5120,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,4096,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,3584,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,3072,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,2560,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,1536,0.005891199906667074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,1024,0.005039999882380167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,2048,0.006701866785685222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,256,0.004069333275159201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,768,0.0046623999873797095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,512,0.004524800181388855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,128,0.004045866678158442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,64,0.0035957333942254386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,32,0.003973333289225897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,12288,0.03413333495457967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,128,65536,0.1752405325571696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,16384,0.04843519926071167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,7168,0.01965120037396749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,10240,0.029764266808827718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,8192,0.023894399404525757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,4096,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,5120,0.01029973328113556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,6144,0.015212800105412802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,3584,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,2560,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,3072,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,2048,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,1536,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,1024,0.005120000243186951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,512,0.004370133578777313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,768,0.004621866842110952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,256,0.003928533444801966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,64,0.00363520011305809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,128,0.003655466685692469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,32,0.0035360001027584078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,12288,0.03242773413658142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,16384,0.05044906536738077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,64,65536,0.17114453315734862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,7168,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,10240,0.02791999975840251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,8192,0.021639466285705566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,4096,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,6144,0.014246400197347006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,5120,0.009548800190289815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,3584,0.0074314668774604796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,3072,0.007010133564472198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,2560,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,1536,0.005779199798901876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,1024,0.004881066580613455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,2048,0.005449600021044413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,256,0.003942399968703588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,768,0.004744533201058706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,512,0.004231466849644979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,128,0.0035946667194366455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,32,0.0035114665826161706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,12288,3.9034217834472655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,16384,5.809120178222656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,65536,0.16254293123881022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,8192,2.4971275329589844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,7168,2.3161888122558594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,10240,3.5935274759928384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,4096,1.2107775370279947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,5120,1.5793173472086588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,6144,1.957684326171875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,3072,0.9008127848307291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,2560,0.7917568206787109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,3584,1.0682367960611978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,1536,0.49646933873494464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,2048,0.6078122456868489
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,1024,0.33481388092041015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,512,0.1862346649169922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,768,0.2643285274505615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,256,0.12759040196736654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,128,0.10151253541310627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,64,0.08587946891784667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,65536,32,0.0881322701772054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,12288,0.9079125086466471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,16384,1.2228608449300131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,8192,0.6443370819091797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,10240,0.8122357050577799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,7168,0.5660671869913737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,6144,0.4668416023254395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,5120,0.4111018816630046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,4096,0.3107487996419271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,3584,0.28447999954223635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,3072,0.23995733261108398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,2560,0.20544853210449218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,2048,0.1630890687306722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,1536,0.1271125316619873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,1024,0.0868010679880778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,65536,5.456899007161459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,768,0.06946132977803549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,256,0.03392746845881144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,512,0.05007253487904867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,128,0.029901866118113202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,64,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,16384,32,0.025942399104436235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,12288,0.761685307820638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,16384,0.8976064046223959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,8192,0.4819295883178711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,10240,0.6108842849731445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,7168,0.41437867482503254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,6144,0.3634175936381022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,5120,0.29395627975463867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,4096,0.239683198928833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,3584,0.20544959704081217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,3072,0.18097599347432453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,2560,0.14834027290344237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,2048,0.12274346351623536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,1536,0.09212586879730225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,65536,4.284657287597656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,1024,0.06509226560592651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,768,0.05010559956232706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,512,0.037887998421986896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,256,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,128,0.02327893376350403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,64,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,12288,32,0.02060479919115702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,12288,0.6065845489501953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,16384,0.8082773208618164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,8192,0.41881599426269533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,10240,0.496947193145752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,7168,0.361028258005778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,6144,0.31518828074137367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,5120,0.2564095973968506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,4096,0.19944106737772624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,3584,0.17988266944885253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,3072,0.15004693667093913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,2560,0.12888747056325275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,2048,0.10219626426696778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,65536,3.573114776611328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,1536,0.08011093139648437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,1024,0.05457813342412313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,768,0.04055253267288208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,512,0.031336534023284915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,256,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,128,0.020412800709406535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,64,0.018489599227905273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,10240,32,0.019308799505233766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,12288,0.47783253987630203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,16384,0.6480554580688477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,8192,0.3339946746826172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,10240,0.405026117960612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,7168,0.2907456080118815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,6144,0.24166399637858071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,5120,0.20524479548136393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,4096,0.16049386660257975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,3584,0.14458880424499512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,3072,0.12195306619008381
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,2560,0.10492586294809977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,2048,0.08321812947591146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,65536,2.7155830383300783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,1536,0.06529813210169474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,1024,0.04416960080464681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,768,0.03324586749076843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,512,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,128,0.01813760002454122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,256,0.018897066513697304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,64,0.01923840045928955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,8192,32,0.01972800095876058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,12288,0.39813121159871423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,16384,0.5442901611328125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,10240,0.34102506637573243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,8192,0.2899285316467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,7168,0.24248000780741372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,6144,0.2168490727742513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,4096,0.1432917277018229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,5120,0.17134826978047688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,3072,0.10390293598175049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,3584,0.1257813294728597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,2048,0.07410346666971843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,2560,0.08734613259633382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,1024,0.03740799824396769
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,1536,0.05655893484751383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,65536,2.035096486409505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,768,0.029217066367467244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,512,0.022259199619293214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,256,0.016846932967503867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,128,0.014859732985496522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,64,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,7168,32,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8192,32,64,0.0035317334036032355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,10240,0.3179861386617025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,12288,0.3709962526957194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,16384,0.5171872138977051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,6144,0.19486826260884602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,8192,0.2564767996470133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,7168,0.22244693438212076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,4096,0.12639466921488446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,5120,0.16247572898864746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,3584,0.11144533157348632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,2560,0.08219306468963623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,3072,0.09533440272013347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,2048,0.06461439927419027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,1024,0.03426986535390218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,1536,0.05051733255386352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,768,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,512,0.019844265778859456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,256,0.015552000204722086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,128,0.014061866203943887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,64,0.012026666601498922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,32,0.012409599622090657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,6144,65536,1.9228341420491535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,12288,0.3079509417215983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,16384,0.3980842590332031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,10240,0.26180267333984375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,8192,0.21746346155802407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,7168,0.18595840136210123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,6144,0.15469013849894206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,5120,0.13503146171569824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,4096,0.10512959957122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,3584,0.09021440347035727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,3072,0.0809653361638387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,2560,0.06673173109690347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,2048,0.05307519833246867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,1024,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,1536,0.041915734608968094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,768,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,128,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,512,0.01731946667035421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,256,0.013639466961224875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,64,0.009923199812571209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,32,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,5120,65536,1.5488341013590494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,12288,0.2439861297607422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,16384,0.31566505432128905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,10240,0.21589226722717286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,8192,0.1718272050221761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,7168,0.14574933052062988
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,5120,0.10591680208841961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,6144,0.12608853181203206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,4096,0.08307946523030599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,3584,0.0741706689198812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,2560,0.05277226765950521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,3072,0.06410239934921265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,1536,0.03304106593132019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,2048,0.043484799067179364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,1024,0.023334399859110514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,768,0.01827413241068522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,512,0.014039466778437296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,256,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,128,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,64,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,32,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,4096,65536,1.265937042236328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,16384,0.3046741485595703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,12288,0.23145813941955568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,10240,0.18343146642049152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,8192,0.14458880424499512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,6144,0.11004479726155598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,7168,0.12622506618499757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,4096,0.07301013469696045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,5120,0.08919040362040201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,3584,0.06263573169708252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,3072,0.055055999755859376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,2560,0.04512319962183635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,2048,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,1024,0.02004800041516622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,1536,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,768,0.01575573285420736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,512,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,256,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,128,0.0083146666487058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,64,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,32,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3584,65536,1.1585173288981119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,12288,0.19472959836324055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,16384,0.25128960609436035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,10240,0.15885653495788574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,8192,0.131822935740153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,7168,0.11335679690043132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,6144,0.09635840257008871
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,5120,0.08291093508402506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,4096,0.064955735206604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,3584,0.0559445341428121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,2048,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,2560,0.041915734608968094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,1024,0.018548266092936198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,1536,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,768,0.015133866667747497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,512,0.013155200084050498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,128,0.01043839951356252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,256,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,64,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,32,0.010286933183670044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,65536,0.973687489827474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,16384,0.21712212562561034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,12288,0.1650005340576172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,10240,0.13632960319519044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,8192,0.10874880154927571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,7168,0.09512960116068522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,6144,0.08140906492869059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,5120,0.06809600194295248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,4096,0.054169599215189615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,3584,0.04730666478474935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,3072,0.040482131640116374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,2560,0.03413333495457967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,65536,0.8136704126993815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,2048,0.02757866581281026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,1536,0.02168853282928467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,1024,0.015271466970443726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,768,0.01242453356583913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,512,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,256,0.00827519992987315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,64,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,128,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2560,32,0.006666666766007741
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,12288,0.11990826924641926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,16384,0.16131307284037272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,10240,0.10711039702097576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,8192,0.08768746852874756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,7168,0.0779263973236084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,6144,0.0670687993367513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,5120,0.05505706469217936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,4096,0.0445087989171346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,3584,0.03856746753056844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,3072,0.033861335118611655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,2560,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,2048,0.023949867486953734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,1536,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,65536,0.6152522404988606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,1024,0.014050133029619851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,768,0.011961600184440613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,512,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,128,0.007865599791208903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,64,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,256,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,2048,32,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,12288,0.09414186477661132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,16384,0.12670293649037678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,10240,0.09004373550415039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,8192,0.0723626693089803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,7168,0.06198613246281942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,6144,0.05246400038401285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,5120,0.043347199757893876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,4096,0.034679468472798666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,3584,0.030173865954081218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,3072,0.02662613391876221
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,2560,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,2048,0.018147200345993042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,65536,0.4819978713989258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,1536,0.014760532975196838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,1024,0.011185066898663838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,768,0.009947733084360758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,512,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,128,0.006326400240262349
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,64,0.006258133550484974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1536,32,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,12288,0.06683306694030762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,16384,0.08748266696929932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,10240,0.056081068515777585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,8192,0.04437333345413208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,7168,0.039800532658894855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,6144,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,5120,0.028943999608357744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,4096,0.0230730672677358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,3584,0.02157333294550578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,3072,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,2560,0.01690773367881775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,2048,0.01360426644484202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,65536,0.3346773465474447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,1536,0.011945600310961407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,768,0.008236800134181977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,1024,0.009101866682370504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,512,0.0066997334361076355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,256,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,128,0.005295999844868978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,64,0.00520000010728836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,1024,32,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,12288,0.05174506505330404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,16384,0.06942719618479411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,8192,0.03536213239034017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,10240,0.04369066556294759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,6144,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,7168,0.03065173427263896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,5120,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,4096,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,3072,0.015270400047302245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,3584,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,2048,0.011205333471298217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,2560,0.013633066415786743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,1024,0.007894399762153625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,1536,0.009880533814430237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,65536,0.2694485346476237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,512,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,768,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,256,0.005171200136343638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,128,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,64,0.0044821331898371375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,768,32,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,16384,0.05058559974034628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,12288,0.039188265800476074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,8192,0.025940267244974773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,10240,0.03215893308321635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,6144,0.019317332903544107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,7168,0.02232426603635152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,5120,0.016489600141843162
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,4096,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,3584,0.0125408003727595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,3072,0.011142399907112122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,2560,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,2048,0.008692266543706258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,65536,0.19097599983215333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,1536,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,768,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,1024,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,512,0.00528959979613622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,256,0.004589866598447164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,64,0.004030933231115341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,128,0.004373333354791006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,512,32,0.003949866692225138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,12288,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,16384,0.038023467858632407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,10240,0.02191466689109802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,8192,0.017324799299240114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,3072,3072,0.050177065531412754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,7168,0.01513706644376119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,5120,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,6144,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,4096,0.010357333223025005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,3584,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,3072,0.00872320036093394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,2560,0.007935999830563863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,2048,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,1536,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,1024,0.005510400235652924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,768,0.005005866785844167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,512,0.0047872001926104225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,256,0.00409706657131513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,128,0.003937066594759623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,65536,0.11287893454233806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,32,0.004005333284536997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,256,64,0.003623466690381368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,10240,0.015753600001335143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,12288,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,16384,0.029764266808827718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,7168,0.012401066223780314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,8192,0.013262933492660523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,6144,0.010785067081451416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,5120,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,3584,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,4096,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,3072,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,2560,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,2048,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,1024,0.004810666541258494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,1536,0.005444266895453135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,768,0.00439573327700297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,256,0.003964799890915553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,512,0.004102399945259095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,128,0.003655466685692469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,64,0.0034986667335033415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,32,0.0036501333117485045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,128,65536,0.093012269337972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,12288,0.018343466520309448
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,16384,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,10240,0.015689599514007568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,8192,0.012809600432713827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,7168,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,6144,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,5120,0.009194667140642803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,4096,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,3584,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,3072,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,2048,0.0057888001203536986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,1536,0.005030400057633718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,1024,0.0045525332291920986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,768,0.004306133091449738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,256,0.0036831999818483984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,512,0.004011733333269755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,64,0.0032586666444937387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,32,0.0034965333839257562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,128,0.0035114665826161706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,64,65536,0.09018026987711589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,12288,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,16384,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,10240,0.01236799955368042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,8192,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,7168,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,5120,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,6144,0.009136000275611877
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,4096,0.009966933727264404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,2560,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,3584,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,3072,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,1536,0.004934399823347728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,2048,0.0055061335364977515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,1024,0.004439466694990794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,512,0.004149333387613296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,768,0.004299733539422353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,256,0.0036746665835380556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,128,0.003619199991226196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,64,0.00322026660044988
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,32,0.0030826665461063385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4096,32,65536,0.08837119738260904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,12288,1.937135950724284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,10240,1.6167957305908203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,8192,1.225661849975586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,16384,2.7492022196451824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,7168,1.1182762145996095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,6144,0.9233397165934244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,4096,0.6205098470052083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,5120,0.7407274881998698
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,2048,0.31423041025797527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,2560,0.3887786547342936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,3584,0.5616298675537109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,3072,0.4739413261413574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,1024,0.17346453666687012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,1536,0.24111572901407877
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,768,0.1340768019358317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,512,0.09676799774169922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,128,0.053931732972462974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,256,0.06601386864980062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,64,0.04952746629714966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,65536,32,0.04881173372268677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,12288,0.49025707244873046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,10240,0.40311253865559893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,16384,0.64672425587972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,8192,0.32839787801106773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,6144,0.23770453135172526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,7168,0.27955201466878254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,4096,0.16015146573384603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,5120,0.20381013552347818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,3584,0.14131199518839518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,3072,0.12191359996795655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,2560,0.10508266290028889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,2048,0.08359253406524658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,1536,0.06410026550292969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,1024,0.04587626854578654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,768,0.035019731521606444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,512,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,256,0.01930453379948934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,128,0.01811306675275167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,65536,2.774736022949219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,64,0.019428267081578573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,16384,32,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,10240,0.32983039220174154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,12288,0.3676512082417806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,16384,0.4729162534077962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,7168,0.22340265909830728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,8192,0.265010134379069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,6144,0.1878357410430908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,4096,0.13028799692789714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,5120,0.15776534080505372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,3584,0.10987626711527507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,2048,0.06379520098368327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,2560,0.08024746576944987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,3072,0.09861120382944742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,1024,0.034680533409118655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,1536,0.04912746747334798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,768,0.027715200185775758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,512,0.020660267273585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,256,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,128,0.014389333128929139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,65536,1.8676053365071614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,32,0.012777599692344665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,12288,64,0.012366933623949687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,10240,0.27770878473917643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,12288,0.2942303975423177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,16384,0.4037290573120117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,8192,0.2205344041188558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,7168,0.1892031987508138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,6144,0.16417600313822428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,4096,0.10748693148295085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,5120,0.13564799626668295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,3584,0.09659732977549235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,3072,0.08164693514506022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,2560,0.06973546346028646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,2048,0.057309865951538086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,1024,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,1536,0.043689600626627606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,65536,1.5594154357910157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,512,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,256,0.0141184002161026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,768,0.02443839907646179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,128,0.013979732990264893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,32,0.011994666854540507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,12288,0.24200426737467445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,16384,0.3325610796610514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,10240,0.2069514592488607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,8192,0.1703231970469157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,7168,0.14315412839253744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,6144,0.12851200103759766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,5120,0.10257066885630291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,4096,0.08611839612325033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,65536,1.250167465209961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,3584,0.07314559618631998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,3072,0.06560426553090414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,2560,0.05403306484222412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,1536,0.034406399726867674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,2048,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,512,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,768,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,1024,0.02409600019454956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,256,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,128,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,64,0.010775466759999592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,8192,32,0.011126400033632914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,12288,0.20537919998168946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,16384,0.2778474807739258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,10240,0.1731925328572591
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,8192,0.14172266324361166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,7168,0.12107093334197998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,6144,0.1057802677154541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,5120,0.08635733127593995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,4096,0.07120213508605958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,65536,1.0880011240641276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,3584,0.06154239972432455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,2560,0.04693439801534017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,3072,0.05444266796112061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,2048,0.03659093379974365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,1536,0.028804266452789308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,768,0.016296533743540446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,1024,0.020538665850957236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,256,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,512,0.012273066242535909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,128,0.00872320036093394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,64,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,7168,32,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,12288,0.18933760325113932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,16384,0.24152746200561523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,10240,0.16309119860331217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,8192,0.12363093694051105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,6144,0.09911999702453614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,7168,0.11264106432596843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,5120,0.07782399654388428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,4096,0.066594131787618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,65536,0.9342293421427408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,3584,0.05618346532185873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,3072,0.05045013427734375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,2048,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,1536,0.027236266930898027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,2560,0.04184533357620239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,1024,0.018889600038528444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,768,0.015346133708953857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,512,0.01316480040550232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,256,0.01076586643854777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,128,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,64,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,6144,32,0.010150399804115296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,12288,0.16356800397237142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,16384,0.21964586575826012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,10240,0.13192533651987712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,8192,0.10718080202738445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,7168,0.09072533448537191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,6144,0.07956480185190837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,5120,0.06502293348312378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,4096,0.05382826725641886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,65536,0.8567455927530924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,3584,0.046147199471791585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,2560,0.035155200958251955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,3072,0.04082346757253011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,2048,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,1536,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,768,0.012641066312789917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,1024,0.015927466750144958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,512,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,256,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,128,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,64,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,5120,32,0.006667733192443848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,12288,0.11909120082855225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,16384,0.16370347340901692
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,10240,0.1040725310643514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,8192,0.08615360260009766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,7168,0.07260159651438394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,6144,0.06451093355814616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,5120,0.05218986670176188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,4096,0.04369066556294759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,65536,0.6544384002685547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,3584,0.03795733451843262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,3072,0.03379199902216594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,2048,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,1536,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,1024,0.014644267161687216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,768,0.011523200074831645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,512,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,256,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,128,0.007115733126799266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,64,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,32,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,16384,0.15387199719746908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,12288,0.11649706363677978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,10240,0.10629013379414876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,65536,0.6330015818277995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,8192,0.08482240041097006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,7168,0.07765226364135742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,6144,0.06369173526763916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,5120,0.05546666781107584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,4096,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,3072,0.03317760030428569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,3584,0.03932160139083862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,2560,0.028126933177312213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,2048,0.024165334304173787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,1536,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,1024,0.014392532904942832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,768,0.011991467078526814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,512,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,256,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,128,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,64,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3584,32,0.005826133489608765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,16384,0.12625919977823893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,12288,0.09581333001454671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,10240,0.0855733315149943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,65536,0.4759210586547852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,8192,0.06802666982014974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,7168,0.05707199970881144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,6144,0.05048319896062216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,5120,0.0409610668818156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,4096,0.0339957316716512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,3584,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,3072,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,2560,0.021844265858332317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,1536,0.014999467134475707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,1024,0.011586133639017742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,768,0.009593600034713745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,512,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,128,0.007009066641330719
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,64,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,32,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,65536,0.41011091868082683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,16384,0.1071775992711385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,12288,0.08144213358561198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,10240,0.0686090628306071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,8192,0.05461440086364746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,10240,64,0.01242453356583913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,7168,0.04761600097020467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,6144,0.041230932871500654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,5120,0.03433813254038493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,4096,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,3584,0.024848000208536784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,3072,0.02198293407758077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,2560,0.01877440015474955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,2048,0.015737600127855935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,1536,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,1024,0.009897599617640179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,512,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,256,0.006566399832566579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,128,0.00581333339214325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,64,0.00544213354587555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2560,32,0.005478399991989136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,16384,0.08506027062733969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,12288,0.06437546809514363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,10240,0.05423680146535238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,65536,0.32549546559651693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,8192,0.04355413516362508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,6144,0.03379199902216594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,7168,0.03781973520914714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,4096,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,5120,0.028947200377782183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,3584,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,3072,0.019454934199651084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,2048,0.014724266529083253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,2560,0.016567466656366985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,1024,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,1536,0.011642666657765706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,768,0.008274133503437042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,512,0.00697813332080841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,256,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,128,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,64,0.005064533154169718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,2048,32,0.005063466727733612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,16384,0.06946132977803549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,12288,0.05280426740646362
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,10240,0.0443061351776123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,8192,0.03604480028152466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,7168,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,6144,0.027509333690007527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,5120,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,4096,0.019661867618560792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,3584,0.017272533973058064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,3072,0.015408000349998474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,2560,0.013633066415786743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,2048,0.012051199873288471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,1536,0.009910399715105694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,1024,0.00810346653064092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,768,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,512,0.006259199976921081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,256,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,128,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,64,0.004231466849644979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,32,0.0045525332291920986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,65536,0.1842517375946045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,16384,0.048093867301940915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,12288,0.03631786505381267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,4096,2560,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,10240,0.02969706654548645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,8192,0.024100265900293984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,7168,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,6144,0.018694400787353516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,5120,0.016568533579508462
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,4096,0.013470932841300964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,3584,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,3072,0.010771200060844421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,2560,0.009965866804122925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,1536,0.007865599791208903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,2048,0.008654933174451191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,1024,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,768,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,512,0.004995200037956238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,256,0.004458666841189066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,128,0.004382933179537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,32,0.004046933352947235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1024,64,0.00403413325548172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,16384,0.04376000165939331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,12288,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,65536,0.16418132781982422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,8192,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,7168,0.02020906607309977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,6144,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,5120,0.01567893326282501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,3584,0.012025599678357441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,4096,0.013266133268674216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,3072,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,2560,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,2048,0.008713600039482117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,1536,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,1024,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,768,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,512,0.0054058666030565895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,128,0.004420266548792521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,256,0.004911999901135763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,64,0.0044053331017494205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,768,32,0.004334933559099833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,16384,0.0318122665087382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,3072,2048,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,12288,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,10240,0.020127999782562255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,8192,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,65536,0.10233173370361329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,7168,0.015212800105412802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,6144,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,5120,0.012014933427174886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,4096,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,3584,0.009513599673906963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,3072,0.008712533116340637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,2560,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,1536,0.006292266647020976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,2048,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,1024,0.005380266904830932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,768,0.005184000233809153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,512,0.00481386681397756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,256,0.004103466620047887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,128,0.003960533440113068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,32,0.003572266548871994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,512,64,0.0036960000793139136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,12288,0.01814613342285156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,16384,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,8192,0.013507200280825296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,10240,0.016035200158754984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,7168,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,6144,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,5120,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,65536,0.06218986511230469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,4096,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,3584,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,3072,0.007283199826876323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,2560,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,1536,0.0054624001185099285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,2048,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,1024,0.00492799977461497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,768,0.0044608001907666525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,512,0.003961600114901861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,256,0.003967999915281932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,128,0.0036831999818483984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,64,0.0035274667044480645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,256,32,0.003470933437347412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,16384,0.014051199952761332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,12288,0.014393599828084311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,10240,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,8192,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,7168,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,6144,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,5120,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,65536,0.050551466147104894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,4096,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,3584,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,3072,0.007043200234572093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,2560,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,1536,0.005063466727733612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,2048,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,1024,0.004474666714668274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,768,0.004327466587225596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,512,0.0038933334251244865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,256,0.003651199986537298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,128,0.0035274667044480645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,64,0.0032042667269706728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,128,32,0.003606399893760681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,16384,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,12288,0.01285546620686849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,10240,0.011556266744931539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,8192,0.010307199756304423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,7168,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,6144,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,5120,0.008385066191355388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,65536,0.04696746667226155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,4096,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,3584,0.007084799806276958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,3072,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,2560,0.006132266422112783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,2048,0.0055978665749231975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,1536,0.005031466484069824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,1024,0.004531200230121613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,512,0.003933866570393244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,768,0.004368000229199727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,256,0.0037685332198937735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,128,0.0035861333211263022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,64,0.0032501332461833954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,64,32,0.0033258666594823206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,16384,0.010788266857465107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,12288,0.009065600236256917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,10240,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,8192,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,7168,0.01151146690050761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,6144,0.010856533050537109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,5120,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,65536,0.04693333307902019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,4096,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,3584,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,3072,0.006701866785685222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,2560,0.005927466849486033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,1536,0.005051733553409576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,2048,0.005379199981689453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,1536,65536,0.2637824058532715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,1024,0.004522666831811269
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,768,0.004072533299525579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,512,0.0039658665657043455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,256,0.003622400015592575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,128,0.003230933348337809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,64,0.0032405334214369455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2048,32,32,0.003542399903138479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,8192,0.6537216186523438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,10240,0.7954432169596355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,12288,0.9219733556111654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,16384,1.2087285359700521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,7168,0.5698240280151368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,6144,0.48636585871378585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,4096,0.32160425186157227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,5120,0.4000426610310872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,3584,0.29368321100870765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,2560,0.20510719617207845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,3072,0.24821759859720866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,2048,0.16998400688171386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,1536,0.13185706933339436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,1024,0.08816640377044678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,768,0.07055359681447347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,512,0.051677866776784265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,128,0.03051626682281494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,64,0.02765120069185893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,256,0.03556693394978841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,65536,32,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,12288,0.2527232011159261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,16384,0.3288042704264323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,10240,0.2128906726837158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,8192,0.17442132631937662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,7168,0.1505280017852783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,6144,0.12850986321767172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,5120,0.10987520217895508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,4096,0.09173973401387533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,3584,0.08117120265960694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,2560,0.05908480087916056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,3072,0.07147520383199056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,65536,1.2483275095621744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,2048,0.04840000073115031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,1536,0.03549866676330567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,1024,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,768,0.01998186707496643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,512,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,256,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,128,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,64,0.01076586643854777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,16384,32,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,12288,0.19698239962259928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,16384,0.27265707651774085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,10240,0.16069973309834798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,8192,0.12674132982889813
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,7168,0.1152341365814209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,6144,0.09970453580220541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,5120,0.07973546981811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,4096,0.06826666990915933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,3584,0.05894933144251505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,3072,0.04983466863632202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,2560,0.04403093258539836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,65536,1.0245791753133138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,2048,0.03536320130030314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,1536,0.026897066831588747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,1024,0.01978666583697001
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,768,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,256,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,512,0.01381013294061025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,128,0.010431999961535137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,64,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,12288,32,0.010014933347702027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,12288,0.1668437321980794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,16384,0.22674880027770997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,10240,0.14045759836832683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,8192,0.11482346852620443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,6144,0.08434453010559081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,7168,0.10311679840087891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,4096,0.05672959884007772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,5120,0.07127040227254232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,3584,0.05202026764551798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,3072,0.04348586797714234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,2560,0.037342933813730876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,2048,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,65536,0.8426154454549154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,1536,0.023550933599472045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,1024,0.017864533265431724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,768,0.014392532904942832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,512,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,256,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,128,0.008615466952323913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,64,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,10240,32,0.00790826678276062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,12288,0.12827200094858807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,16384,0.16520533561706544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,10240,0.10765653451283771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,8192,0.08826879660288492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,7168,0.07567359606424967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,6144,0.06519466638565063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,4096,0.04464639822642009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,5120,0.05573973258336386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,3584,0.03932266632715861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,65536,0.6194186528523763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,3072,0.034406399726867674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,2560,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,1536,0.019573332866032918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,1024,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,2048,0.0245088001092275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,768,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,512,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,256,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,64,0.007904000083605449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,128,0.006984533369541168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,8192,32,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,16384,0.14731839497884114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,10240,0.08987306753794352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,12288,0.10885120232899984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,7168,0.06403413216272989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,8192,0.07567253112792968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,6144,0.06328426599502564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,5120,0.05184959967931112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,4096,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,3584,0.03809386491775513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,65536,0.5588981628417968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,3072,0.03188160061836243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,2560,0.02826346755027771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,2048,0.02285760045051575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,1536,0.0180021325747172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,1024,0.013290666540463767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,768,0.010797866185506185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,256,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,512,0.00831573357184728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,128,0.0062613333264986675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,64,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,7168,32,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,12288,0.10260266462961834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,16384,0.129911470413208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,10240,0.08468266328175864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,7168,0.05870933135350546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,6144,0.05065279801686605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,8192,0.06987093289693197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,5120,0.04171200195948283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,4096,0.03433706760406494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,3584,0.03099199930826823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,65536,0.5178698539733887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,2560,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,3072,0.026281599203745527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,2048,0.01945599913597107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,768,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,1024,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,1536,0.015482667088508605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,128,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,64,0.0065760001540184024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,6144,32,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,12288,0.08547093073527018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,16384,0.11130879720052082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,10240,0.07164479891459147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,8192,0.05881173213322958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,7168,0.0497322678565979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,6144,0.043117864926656084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,4096,0.029284266630808513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,5120,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,3584,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,65536,0.4172800064086914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,3072,0.022849067052205404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,2560,0.02005866765975952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,1536,0.013564800222714743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,2048,0.01664426624774933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,1024,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,768,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,512,0.007524266839027405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,128,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,256,0.006607999900976817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,64,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,5120,32,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,12288,0.06594560146331788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,10240,0.05331733226776123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,16384,0.08526506423950195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,7168,0.038091735045115156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,8192,0.04498773415883382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,6144,0.03386026620864868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,5120,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,4096,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,3584,0.02108373244603475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,65536,0.3257354736328125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,3072,0.01827626625696818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,2560,0.016235733032226564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,1536,0.01160533328851064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,2048,0.013673599561055502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,768,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,512,0.007075199981530507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,128,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,64,0.0046293333172798155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,256,0.005787733197212219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,4096,32,0.004621866842110952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,10240,0.054749866326649986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,16384,0.08823359807332357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,12288,0.06543466647466024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,8192,0.04416960080464681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,7168,0.03966399828592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,6144,0.0337226668993632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,5120,0.029014400641123456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,4096,0.02430293361345927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,3584,0.02190293272336324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,65536,0.32675838470458984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,3072,0.019845332702000937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,2560,0.01691733400026957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,1536,0.01202880044778188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,2048,0.014678399761517844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,1024,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,768,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,512,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,256,0.005791999896367391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,128,0.004996266464392344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,64,0.004556799928347269
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3584,32,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,10240,0.04212053219477336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,12288,0.05202026764551798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,16384,0.06751573085784912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,8192,0.03413333495457967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,6144,0.02682773272196452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,7168,0.030923734108606975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,5120,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,4096,0.019230933984120686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,3584,0.01732800006866455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,65536,0.259549872080485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,3072,0.015270400047302245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,2560,0.014110933740933737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,2048,0.011594667037328085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,1024,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,768,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,512,0.006234666705131531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,1536,0.009546666344006857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,256,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,128,0.005065600077311197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,64,0.004970666766166687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,3072,32,0.004853333532810211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,12288,0.044513066609700516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,16384,0.057275732358296715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,10240,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,7168,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,8192,0.030242133140563964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,6144,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,5120,0.019500799973805747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,4096,0.01664426624774933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,3584,0.01490239997704824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,65536,0.21486934026082358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,3072,0.013858133554458618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,2560,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,1536,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,2048,0.009955199559529622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,1024,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,768,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,512,0.005611733098824819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,128,0.004760533571243286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,256,0.005231999854246775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,64,0.004380799829959869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2560,32,0.004212266703446706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,10240,0.02969706654548645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,12288,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,16384,0.04748266537984212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,8192,0.02430293361345927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,6144,0.019374932845433554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,5120,0.016567466656366985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,65536,0.18186240196228026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,4096,0.013878400127092997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,3584,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,3072,0.011195733149846395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,2560,0.009516800443331402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,2048,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,1536,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,768,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,1024,0.006231466432412466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,512,0.0052714665730794275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,256,0.004782933493455251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,128,0.004412800073623657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,64,0.004328533510367076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,32,0.004266666869322458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,12288,0.029217066367467244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,16384,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,10240,0.024577067295710246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,8192,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,6144,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,7168,0.018024533987045288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,65536,0.1469098726908366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,4096,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,5120,0.01437226633230845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,3584,0.011128532886505126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,3072,0.010016000270843506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,2560,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,1536,0.007009066641330719
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,1024,0.00584853341182073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,2048,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,768,0.0054058666030565895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,512,0.005016533533732096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,256,0.0048096001148223875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,128,0.004494933287302653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,64,0.004320000112056732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1536,32,0.0043818667531013485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,16384,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,12288,0.023826134204864503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,10240,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,8192,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,7168,0.01574613352616628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,65536,0.09728000164031983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,6144,0.014084266622861228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,5120,0.012469333410263062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,4096,0.010797866185506185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,3072,0.008785067001978557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,2560,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,3584,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,2048,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,1536,0.006295466423034668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,1024,0.005649066468079885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,512,0.004554666578769684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,768,0.005026133358478546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,256,0.00447680006424586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,128,0.004357333481311798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,64,0.004045866678158442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,1024,32,0.004065066576004028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,16384,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,12288,0.018962132930755615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,10240,0.016978132724761962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,8192,0.014082133769989014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,7168,0.013255467017491659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,65536,0.08284160296122232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,6144,0.011527466773986816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,5120,0.010718933741251628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,4096,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,3072,0.00786240001519521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,2560,0.00701333334048589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,3584,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,1536,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,2048,0.006253866851329804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,1024,0.005074133475621542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,768,0.004657066861788432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,512,0.004488533238569895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,256,0.004060799876848856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,128,0.003920000046491623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,64,0.0039264000952243805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,768,32,0.0036778666079044344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,16384,0.020733867088953653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,12288,0.018900267283121743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,10240,0.016327466567357382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,8192,0.013266133268674216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,7168,0.012444800138473511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,65536,0.05536533196767172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,5120,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,6144,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,4096,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,3584,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,2560,0.006567466755708058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,3072,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,1536,0.005166933437188466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,2048,0.00588266650835673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,1024,0.004789333542188009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,768,0.004259199897448222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,512,0.00408746674656868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,256,0.004031999905904134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,64,0.0035071998834609987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,32,0.0035242666800816857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,16384,0.01479039986928304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,12288,0.014014933506647745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,65536,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,8192,0.012869333227475485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,10240,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,7168,0.011991467078526814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,6144,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,5120,0.009124267101287841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,4096,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,3584,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,3072,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,1536,0.00528959979613622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,2048,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,1024,0.004711466530958811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,768,0.004379733403523763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,512,0.0040501333773136135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,256,0.003638399889071783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,128,0.003500800083080927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,32,0.0035242666800816857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,256,64,0.0031871999303499854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,16384,0.01072746713956197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,12288,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,65536,0.02935466567675273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,10240,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,8192,0.010377599795659383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,7168,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,6144,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,4096,0.007999999821186066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,5120,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,3584,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,2560,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,2048,0.005666133264700572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,1536,0.005051733553409576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,1024,0.004565333326657614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,768,0.004327466587225596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,256,0.003684266656637192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,512,0.004014933357636133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,128,0.0035103999078273775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,64,0.0032298666735490165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,128,32,0.0036170666416486105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,16384,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,12288,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,10240,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,65536,0.027306665976842243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,8192,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,7168,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,6144,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,5120,0.007905066510041555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,4096,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,3584,0.007051733136177063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,3072,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,2560,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,2048,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,1024,0.004387199878692627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,1536,0.0048320000370343525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,768,0.004364799956480662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,512,0.003933866570393244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,256,0.0035466666022936503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,128,0.00325546662012736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,64,0.0033173332611719764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,64,32,0.003230933348337809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,16384,0.0123989333709081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,12288,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,65536,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,8192,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,10240,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,7168,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,6144,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,5120,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,4096,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,3584,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,3072,0.006607999900976817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,2560,0.00588266650835673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,1536,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,2048,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,1024,0.004852266609668731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,768,0.0043722664316495265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,512,0.003885866701602936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,256,0.0035904000202814737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,128,0.0035146666069825493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,32,0.003538133452335993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,32,64,0.0032149332265059153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,12288,0.7965695699055989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,16384,0.9822901407877603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,10240,0.6653952280680339
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,8192,0.5186901410420736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,6144,0.4016127904256185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,7168,0.4631200154622396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,5120,0.33467626571655273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,4096,0.26774187088012696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,3584,0.23296000162760416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,3072,0.20080639521280924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,2560,0.16786880493164064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,2048,0.13666987419128418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,1536,0.10816746552785236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,1024,0.07666453520456949
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,768,0.06099626620610556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,512,0.04478186766306559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,256,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,128,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,64,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,65536,32,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,2048,7168,0.02218559980392456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,16384,0.2602325280507406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,12288,0.20066986083984376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,10240,0.17223679224650065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,65536,1.000106684366862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,8192,0.1418570677439372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,7168,0.12192426522572834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,6144,0.10513066450754802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,5120,0.0898805300394694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,4096,0.06809279918670655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,3584,0.06021120150883993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,3072,0.05311146577199301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,2560,0.04403520027796427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,2048,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,1536,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,1024,0.019853866100311278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,768,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,512,0.014050133029619851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,128,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,256,0.01111466685930888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,64,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,16384,32,0.010218666990598042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,16384,0.18926933606465657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,12288,0.1402880032857259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,10240,0.12813653151194254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,8192,0.10123946666717529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,6144,0.07703999678293863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,7168,0.09075946807861328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,65536,0.7162538528442383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,5120,0.06454613208770751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,4096,0.05259946584701538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,3584,0.045465600490570066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,3072,0.03911573489507039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,2560,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,2048,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,1536,0.02157013416290283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,1024,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,512,0.010834133625030518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,256,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,768,0.013264000415802002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,128,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,64,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,12288,32,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,16384,0.1628149350484212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,12288,0.1203541358311971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,10240,0.10315093199412029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,8192,0.08424320220947265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,7168,0.07488853136698405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,65536,0.6286336263020833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,6144,0.06328426599502564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,5120,0.05451093514760336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,4096,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,3584,0.03850239912668864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,3072,0.033861335118611655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,2560,0.028056534131368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,2048,0.023336533705393472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,1024,0.013700266679128012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,1536,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,768,0.011129599809646607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,512,0.010151466727256775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,256,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,64,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,32,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,10240,128,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,12288,0.09844053586324056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,16384,0.13400640487670898
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,8192,0.07099733352661133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,10240,0.08635093371073405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,7168,0.062362666924794516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,65536,0.49906241099039717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,6144,0.05235946575800578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,5120,0.0445087989171346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,4096,0.035361067454020186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,3584,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,3072,0.02778559923171997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,2560,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,2048,0.019577600558598838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,1024,0.012026666601498922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,1536,0.015962666273117064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,512,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,768,0.009910399715105694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,128,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,32,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,8192,64,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,16384,0.11636053721110026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,12288,0.08635733127593995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1024,512,128,0.00363520011305809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,10240,0.07625493208567301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,8192,0.059835731983184814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,7168,0.05137173334757487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,6144,0.04628373384475708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,65536,0.4487157185872396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,5120,0.038365864753723146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,4096,0.030717867612838744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,3584,0.028195200363794963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,3072,0.02430400053660075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,2048,0.017249067624409996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,2560,0.02074133356412252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,1024,0.010357333223025005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,1536,0.014051199952761332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,768,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,512,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,256,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,128,0.005447466671466827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,64,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,7168,32,0.005287466446558634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,12288,0.07284159660339355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,16384,0.09983893235524496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,10240,0.06260159810384115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,8192,0.04979946613311768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,7168,0.04560533364613851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,6144,0.03891306718190511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,5120,0.032085333267847696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,4096,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,65536,0.37778774897257483
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,3072,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,3584,0.023962666591008507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,2048,0.01574720044930776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,1536,0.012843733032544455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,512,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,1024,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,256,0.005851733187834421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,128,0.005004799862702688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,64,0.004996266464392344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,6144,32,0.004850133260091146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,12288,0.06505706707636515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,16384,0.08769066333770752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,10240,0.054681599140167236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,8192,0.04423679908116658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,7168,0.040140799681345624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,6144,0.03399786551793416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,5120,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,65536,0.3275775909423828
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,4096,0.02402879993120829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,3584,0.021423999468485513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,3072,0.019640533129374187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,2560,0.016973867019017538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,2048,0.014938666423161825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,1024,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,1536,0.01251413325468699
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,512,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,256,0.006095999975999197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,64,0.005064533154169718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,32,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,5120,128,0.005346133311589559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,16384,0.0667306661605835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,12288,0.05287359952926636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,10240,0.043622398376464845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,8192,0.034886399904886886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,7168,0.03181119958559672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,6144,0.027164800961812334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,5120,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,4096,0.01945599913597107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,65536,0.2618218739827474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,3584,0.01732800006866455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,3072,0.015338666240374246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,2560,0.013844266533851624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,2048,0.012436266740163167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,1536,0.009750399986902874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,1024,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,512,0.0065642664829889934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,768,0.007051733136177063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,128,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,256,0.005416533350944519
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,64,0.004670933385690053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,4096,32,0.005004799862702688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,10240,0.038363734881083175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,12288,0.04498773415883382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,16384,0.05894613265991211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,7168,0.027305599053700762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,8192,0.031336534023284915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,6144,0.023960532744725545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,65536,0.222651735941569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,5120,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,4096,0.01726186672846476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,3584,0.015378133455912272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,3072,0.013597866892814637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,2560,0.012198399504025776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,1536,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,1024,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,768,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,512,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,128,0.0045045331120491024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,64,0.004379733403523763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,32,0.004253866771856943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3584,256,0.004658133288224538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,12288,0.040345601240793866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,16384,0.0519157330195109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,10240,0.03365653355916341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,7168,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,8192,0.02757866581281026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,6144,0.021014400323232017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,5120,0.0182751993338267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,65536,0.1955509344736735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,4096,0.01548479994138082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,3584,0.013677866260210673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,2560,0.010830932855606079
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,3072,0.012060800194740295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,2048,0.009373866518338521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,1536,0.007635200023651123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,1024,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,768,0.00584853341182073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,512,0.005037866532802582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,128,0.0041792000333468115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,64,0.0040224000811576845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,256,0.004763733347256978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,3072,32,0.003953066716591517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,10240,0.03003840049107869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,16384,0.04608000119527181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,12288,0.035019731521606444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,8192,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,7168,0.021241599321365358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,6144,0.018966400623321535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,4096,0.014072533448537192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,65536,0.1718272050221761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,5120,0.01650773286819458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,3584,0.012345600128173827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,2560,0.009897599617640179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,3072,0.011538133025169373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,2048,0.008725333213806152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,1536,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,1024,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,768,0.0058773333827654515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,512,0.005072000126043955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,128,0.0044064000248909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,64,0.004343466460704803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,256,0.004794666667779287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2560,32,0.004436266422271728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,10240,0.02573546568552653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,16384,0.040210131804148355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,12288,0.03031146725018819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,8192,0.02108479936917623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,7168,0.01895786722501119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,6144,0.01650773286819458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,4096,0.012537599603335062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,5120,0.014458666245142618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,65536,0.1473888079325358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,3584,0.01097920040289561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,3072,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,2048,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,2560,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,1536,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,768,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,1024,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,512,0.005038933455944061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,128,0.004377600053946177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,64,0.004430933296680451
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,256,0.004730666677157084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,2048,32,0.004163199911514918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,10240,0.02232426603635152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,16384,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,12288,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,8192,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,7168,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,6144,0.014869333306948344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,65536,0.12718079884847006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,4096,0.01153600017229716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,5120,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,3584,0.00995306670665741
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,3072,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,2560,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,2048,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,1536,0.006262399752934774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,1024,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,768,0.004995200037956238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,512,0.004401066899299621
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,128,0.004008533308903376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,64,0.00365226666132609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,256,0.004247466723124186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1536,32,0.003640533238649368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,10240,0.019578667481740315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,16384,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,12288,0.02321066657702128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,7168,0.014061866203943887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,8192,0.01630400021870931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,6144,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,65536,0.08444586594899496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,5120,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,4096,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,3584,0.008113066852092742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,3072,0.007524266839027405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,2560,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,2048,0.006168533364931742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,1536,0.005460266768932342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,768,0.004844800134499868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,512,0.004355200131734212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,128,0.0040554667512575785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,64,0.0036501333117485045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,256,0.003980800012747447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,32,0.0039434666434923805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,16384,0.020331732432047524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,12288,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,8192,0.014074666301409402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,10240,0.0160970667997996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,65536,0.06481920083363851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,7168,0.012810666362444559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,6144,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,5120,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,4096,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,3072,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,3584,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,2560,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,2048,0.0058559998869895935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,1024,0.004763733347256978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,1536,0.005578666428724925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,768,0.004334933559099833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,512,0.004075733323891958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,256,0.004051200052102407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,128,0.0035978667438030243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,64,0.0034847999612490333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,768,32,0.003929600119590759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,16384,0.018684800465901694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,12288,0.015892266233762106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,10240,0.0160863995552063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,8192,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,65536,0.04652373393376668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,7168,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,5120,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,6144,0.010307199756304423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,4096,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,3584,0.007905066510041555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,2560,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,3072,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,1536,0.005691733459631602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,2048,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,1024,0.004802133142948151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,768,0.004397866626580557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,512,0.004026666780312856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,256,0.003962666789690653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,128,0.0036202666660149893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,64,0.0035402665535608927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,512,32,0.003550933301448822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,16384,0.014014933506647745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,12288,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,10240,0.010945066809654236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,65536,0.03379093408584595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,8192,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,7168,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,6144,0.010286933183670044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,4096,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,5120,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,3584,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,3072,0.0066442668437957765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,2560,0.006548266609509785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,2048,0.00581333339214325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,1536,0.004935466746489207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,1024,0.004789333542188009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,768,0.004456533491611481
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,512,0.004018133382002512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,128,0.0035616000493367515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,256,0.0036469332873821257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,64,0.003554133325815201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,256,32,0.0035018667578697203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,16384,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,12288,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,10240,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,8192,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,65536,0.025450666745503742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,6144,0.008205866813659668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,7168,0.00862506628036499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,5120,0.00831573357184728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,4096,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,3584,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,2560,0.006189866860707601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,2048,0.005381333331267038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,3072,0.006607999900976817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,1536,0.00520000010728836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,1024,0.004163199911514918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,768,0.004153600086768469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,512,0.003673599908749262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,256,0.0035936000446478524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,128,0.0032106667757034303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,64,0.0032672000428040824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,128,32,0.0031786667803923286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,12288,0.008654933174451191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,16384,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,8192,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,10240,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,65536,0.022516266504923502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,7168,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,6144,0.007870933413505555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,4096,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,3584,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,5120,0.008282666901747386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,3072,0.007181866466999054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,2560,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,2048,0.005529599885145823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,1536,0.004917333523432413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,1024,0.00436160018046697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,768,0.004078933348258337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,512,0.00365226666132609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,256,0.003433600068092346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,64,0.0032170665760835014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,128,0.0032501332461833954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,64,32,0.0030975999931494398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,12288,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,16384,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,10240,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,8192,0.00862506628036499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,65536,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,7168,0.008283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,6144,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,5120,0.007521066566308339
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,4096,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,3072,0.007456000149250031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,3584,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,2560,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,2048,0.0055637334783871974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,1024,0.004428799947102865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,1536,0.005051733553409576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,768,0.004063999901215235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,512,0.003956266740957896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,256,0.0035242666800816857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,128,0.003302400062481562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,64,0.003537066777547201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,32,32,0.003319466610749563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,12288,0.522376537322998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,10240,0.42926826477050783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,16384,0.6811029434204101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,8192,0.35310932795206706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,6144,0.25975467363993326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,7168,0.3009888013203939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,4096,0.17571840286254883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,5120,0.2233344078063965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,3584,0.15496212641398113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,2560,0.11540586948394775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,3072,0.133733336130778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,2048,0.09171626567840577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,1024,0.049628798166910806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,1536,0.0719871997833252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,768,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,512,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,256,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,128,0.01753066579500834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,64,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,65536,32,0.015688533584276833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,12288,0.13329173723856608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,16384,0.17278292973836262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,10240,0.11506346861521403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,8192,0.09021440347035727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,6144,0.06853866577148438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,7168,0.08116906483968099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,65536,0.6658762613932292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,5120,0.05789013306299845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,4096,0.04775360027949015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,3584,0.04171093304951985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,3072,0.03631786505381267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,2560,0.031267199913660684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,1024,0.015554133057594299
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,1536,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,512,0.011108266313870747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,768,0.012410666545232136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,256,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,64,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,32,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,16384,0.1349290688832601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,12288,0.1019210656483968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,65536,0.5041834513346355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,10240,0.08970239957173666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,8192,0.0702122688293457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,7168,0.06372693379720053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,5120,0.046011734008789065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,6144,0.05358933210372925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,3584,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,4096,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,3072,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,2560,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,2048,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,1536,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,1024,0.01267519990603129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,768,0.01039573351542155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,512,0.008738133311271667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,128,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,64,0.006676266590754191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,12288,32,0.006566399832566579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,16384,0.11755519707997639
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,12288,0.08888320128122965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,65536,0.46564693450927735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,10240,0.07359146277109782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,8192,0.06075733502705892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,7168,0.05239466826121012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,6144,0.046147199471791585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,5120,0.03829760154088338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,4096,0.03174293239911397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,3584,0.027716267108917236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,2560,0.02066453297932943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,2048,0.017595734198888144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,1536,0.014075733224550881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,1024,0.010806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,768,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,512,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,256,0.006701866785685222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,128,0.005789866546789805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,64,0.005475200215975444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,10240,32,0.0058229332168896995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,16384,0.09175039927164713
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,12288,0.06946240266164144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,65536,0.34676052729288737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,10240,0.05857280095418295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,8192,0.04642133315404256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,7168,0.04164266586303711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,6144,0.03563520113627116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,5120,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,4096,0.02539413372675578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,3072,0.02032426595687866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,2560,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,2048,0.015677866339683533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,1536,0.012957866986592612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,1024,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,768,0.008589866757392883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,512,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,256,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,128,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,64,0.004972800115744273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,8192,32,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,16384,0.08581120173136393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,12288,0.06485546827316284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,65536,0.3389098803202311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,768,1024,1024,0.004670933385690053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,10240,0.05444373289744059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,7168,0.03809279998143514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,8192,0.04471360047658284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,6144,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,5120,0.02805759906768799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,4096,0.023894399404525757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,3584,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,3072,0.018478933970133463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,2560,0.016369066635767617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,2048,0.014042666554450989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,1536,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,768,0.007865599791208903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,1024,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,512,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,256,0.005485866467158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,128,0.004695466657479604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,64,0.004668800036112467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,7168,32,0.004586666822433472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,16384,0.06809493700663248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,12288,0.05290559927622477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,8192,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,10240,0.04389546712239583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,65536,0.27607145309448244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,6144,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,7168,0.032151466608047484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,5120,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,4096,0.019454934199651084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,3584,0.017867734034856163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,3072,0.015827199816703795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,2560,0.014039466778437296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,2048,0.012641066312789917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,1536,0.010376532872517902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,1024,0.008035199840863545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,768,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,512,0.006234666705131531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,256,0.005469866593678792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,128,0.005086933573087057
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,64,0.004710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,6144,32,0.004995200037956238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,16384,0.06106453339258829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,12288,0.04485119978586833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,8192,0.031061333417892457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,10240,0.03918613195419311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,65536,0.22988692919413248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,7168,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,6144,0.024642133712768556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,5120,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,4096,0.016911999384562174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,3584,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,3072,0.01434879998366038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,2560,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,2048,0.011011200149854024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,1536,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,1024,0.007348266740640004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,512,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,768,0.006404266754786174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,256,0.005077333251635233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,128,0.0048320000370343525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,64,0.0043722664316495265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,5120,32,0.0042133331298828125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,16384,0.0516426682472229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,12288,0.038365864753723146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,8192,0.026759467522303265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,10240,0.03345066706339518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,65536,0.19063466389973957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,7168,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,6144,0.020207999149958293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,5120,0.01725119948387146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,4096,0.014245333274205527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,3584,0.01316373348236084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,3072,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,2560,0.01055999994277954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,2048,0.008932266632715862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,1536,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,1024,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,768,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,512,0.005062399804592133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,256,0.004588800172011057
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,64,0.004021333406368891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,128,0.004312533140182495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,4096,32,0.004398933549722036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,16384,0.046353065967559816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,12288,0.034542934099833174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,10240,0.03003840049107869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,8192,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,65536,0.17080426216125488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,6144,0.0181386669476827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,7168,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,5120,0.01588586668173472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,4096,0.013289599617322286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,3584,0.012340266505877178
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,3072,0.011037866274515789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,2560,0.009810133775075277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,2048,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,1536,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,1024,0.005814399818579356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,768,0.005380266904830932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,512,0.0048885335524876915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,256,0.004264533519744873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,64,0.003905066599448522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,128,0.004082133372624716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3584,32,0.004164266586303711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,16384,0.04355520009994507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,12288,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,10240,0.027988266944885255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,8192,0.02239039937655131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,65536,0.1596757411956787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,6144,0.017729065815607705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,5120,0.015613866845766702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,4096,0.013187199831008911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,3584,0.012070399522781373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,3072,0.011043199896812439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,2560,0.009693866968154908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,2048,0.008316799998283386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,1536,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,1024,0.00584853341182073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,768,0.005857066810131073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,512,0.00537066658337911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,256,0.004710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,64,0.004380799829959869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,128,0.004300799965858459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,3072,32,0.004419200122356415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,16384,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,12288,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,8192,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,65536,0.12888747056325275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,6144,0.01527253290017446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,7168,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,5120,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,4096,0.011959466338157653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,3584,0.010806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,3072,0.009532800316810608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,2560,0.008646399776140849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,2048,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,1536,0.006667733192443848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,1024,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,512,0.005276800195376078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,768,0.0050346667567888895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,256,0.00444160004456838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,128,0.004178133110205332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,64,0.003962666789690653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2560,32,0.004042666653792063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,16384,0.03010666569073995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,12288,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,10240,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,8192,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,65536,0.10222079753875732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,7168,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,6144,0.013357866803805032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,5120,0.011991467078526814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,3584,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,4096,0.01040000021457672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,3072,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,2560,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,2048,0.0067445332805315655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,1536,0.006190933287143707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,1024,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,512,0.004835199813048045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,768,0.004969599843025208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,256,0.004375466704368591
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,128,0.004377600053946177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,64,0.003927466770013174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,2048,32,0.004345599810282389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,16384,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,12288,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,10240,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,8192,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,65536,0.08529919783274333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,7168,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,6144,0.012198399504025776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,5120,0.011038933197657268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,4096,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,3072,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,2560,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,2048,0.006600533425807953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,1024,0.005117866893609365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,1536,0.005791999896367391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,768,0.00487253318230311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,512,0.00443200021982193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,256,0.004091733445723852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,128,0.0038880000511805216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,64,0.003705599904060364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,32,0.0038762666285037995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,16384,0.0211626668771108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,12288,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,65536,0.05666133165359497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,10240,0.01609599987665812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,16384,2048,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,8192,0.014385066429773965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,7168,0.012344533205032348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,5120,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,6144,0.010774399836858113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,4096,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,3584,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,3072,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,2048,0.005868799984455109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,2560,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,1536,0.00518506666024526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,1024,0.004870399832725525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,768,0.004333866635958353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,256,0.003950933367013932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,128,0.0034688000877698263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,512,0.0037685332198937735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,64,0.0036288000643253326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1024,32,0.003566933423280716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,16384,0.019093332688013713
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,12288,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,65536,0.04973119894663493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,10240,0.015610667069753012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,8192,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,6144,0.01076693336168925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,5120,0.009272533655166625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,7168,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,4096,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,3584,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,3072,0.007086933155854543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,2560,0.006698666512966156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,2048,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,1536,0.005390933156013489
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,1024,0.004828799764315287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,768,0.0046186665693918865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,256,0.004069333275159201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,512,0.00429013321797053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,128,0.00360000009338061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,64,0.003703466554482778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,768,32,0.0034901333351929987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,16384,0.015338666240374246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,12288,0.014424533645311991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,65536,0.03406399885813395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,10240,0.0125408003727595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,8192,0.01276479959487915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,7168,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,6144,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,4096,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,5120,0.009130666653315227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,3584,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,3072,0.006677333513895671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,2048,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,2560,0.00626986672480901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,1536,0.005004799862702688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,1024,0.00481386681397756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,768,0.004422399898370107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,256,0.003719466676314672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,512,0.0039488000174363455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,128,0.0035904000202814737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,32,0.0032831999162832894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,16384,0.011171199878056844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,12288,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,65536,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,10240,0.011627733707427979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,8192,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,7168,0.009884799520174663
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,6144,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,5120,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,4096,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,3584,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,3072,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,2560,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,1536,0.004972800115744273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,2048,0.0054506664474805195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,1024,0.004334933559099833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,768,0.004346666733423868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,512,0.0039264000952243805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,256,0.003549866626660029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,128,0.0033728001018365227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,64,0.0032842665910720824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,256,32,0.003316266586383184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,16384,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,12288,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,65536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,10240,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,8192,0.008316799998283386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,7168,0.008191999793052674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,6144,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,5120,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,4096,0.007494399944941203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,3584,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,3072,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,2560,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,1536,0.0046304002404212955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,2048,0.005382399757703145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,1024,0.004163199911514918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,768,0.004067199925581614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,512,0.0039264000952243805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,256,0.0035743998984495797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,128,0.0032287999987602235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,64,0.003102933367093404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,128,32,0.003202133377393087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,16384,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,12288,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,65536,0.015200000007947287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,10240,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,8192,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,7168,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,6144,0.007462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,5120,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,4096,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,3584,0.007085866729418437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,2560,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,3072,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,2048,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,1536,0.0046304002404212955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,1024,0.004364799956480662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,768,0.004004266609748204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,512,0.003643733263015747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,256,0.0035466666022936503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,128,0.0032000000278155005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,32,0.0031295999884605407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,64,64,0.00308693324526151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,16384,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,65536,0.020068265994389854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,12288,0.008691199620564779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,10240,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,8192,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,7168,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,6144,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,5120,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,4096,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,3584,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,3072,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,2560,0.006638933221499126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,2048,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,1536,0.0046634669105211895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,768,0.004101333270470301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,1024,0.004335999985535939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,512,0.003669333209594091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,256,0.0034773332377274835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,128,0.0031989333530267083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,64,0.0032138665517171226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,32,32,0.0031669333577156065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,12288,0.4138997395833333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,16384,0.5364394505818685
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,10240,0.34655574162801106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,8192,0.27224852244059244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,7168,0.24432746569315592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,6144,0.2057898680369059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,5120,0.17701652844746907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,4096,0.13974186579386394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,3584,0.12731626828511555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,3072,0.10752000013987224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,2560,0.09291093349456787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,2048,0.07383039792378744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,1536,0.05809280077616373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,1024,0.039937067031860354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,768,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,512,0.02368853290875753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,256,0.016713599363962807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,64,0.015609600146611533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,128,0.014459733168284097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,65536,32,0.01601920028527578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,16384,0.14178986549377443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,12288,0.10693973700205486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,65536,0.5276330629984538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,10240,0.1027786652247111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,8192,0.08249920209248861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,7168,0.07342186768849691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,6144,0.06277333498001099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,5120,0.05369066794713338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,3584,0.03891199827194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,4096,0.042872532208760576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,3072,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,2560,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,2048,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,1536,0.01842133402824402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,1024,0.0139957328637441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,768,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,512,0.009751466910044353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,256,0.00787199983994166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,128,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,64,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,16384,32,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,16384,0.10830399990081788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,12288,0.08185173670450846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,65536,0.41232961018880204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,10240,0.07509333292643229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,8192,0.060931201775868735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,6144,0.04656000137329101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,5120,0.0392522652943929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,4096,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,3584,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,1536,3584,0.009333333373069764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,3072,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,2560,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,2048,0.017465599377950034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,1536,0.014385066429773965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,768,0.009577600161234538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,1024,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,256,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,128,0.005202133456865946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,64,0.0048981333772341405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,32,0.00499839981396993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,16384,0.0886080026626587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,12288,0.06720853646596273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,65536,0.35085439682006836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,10240,0.056694400310516355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,8192,0.04683200120925903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,7168,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,5120,0.03031040032704671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,6144,0.0362496018409729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,4096,0.02532586654027303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,3072,0.019844265778859456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,2560,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,2048,0.01527253290017446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,1024,0.01042133371035258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,1536,0.012854400277137756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,768,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,512,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,256,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,128,0.0054613331953684485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,64,0.005060266455014547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,10240,32,0.0065760001540184024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,16384,0.08195412953694661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,65536,0.30317227045694983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,12288,0.062054399649302164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,10240,0.05225919882456461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,8192,0.043348264694213864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,7168,0.03781973520914714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,5120,0.02839786609013875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,6144,0.03358826637268066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,4096,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,3584,0.020811732610066733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,3072,0.01815999945004781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,2560,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,2048,0.013634133338928222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,1536,0.01183146635691325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,1024,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,512,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,768,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,256,0.005883733431498209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,128,0.005154133339722951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,512,512,64,0.003239466746648153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,64,0.00499839981396993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,8192,32,0.005196799834569296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,16384,0.06849706967671712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,12288,0.05294293165206909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,10240,0.04423679908116658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,65536,0.2651466687520345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,7168,0.032014934221903484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,8192,0.037138132254282634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,6144,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,5120,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,4096,0.01964799960454305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,3584,0.01772800087928772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,3072,0.015410133202870688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,2560,0.013741866747538248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,2048,0.011991467078526814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,1536,0.010016000270843506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,768,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,512,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,1024,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,256,0.005308799942334493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,128,0.004586666822433472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,64,0.004459733267625173
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,7168,32,0.0045525332291920986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,12288,0.04833279848098755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,16384,0.06298986673355103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,65536,0.23599786758422853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,10240,0.04096000194549561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,8192,0.03372373183568318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,6144,0.026213334004084272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,5120,0.02218773365020752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,4096,0.0182751993338267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,3584,0.01637333333492279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,3072,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,2560,0.012888532876968384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,2048,0.011480533083279927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,1024,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,768,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,512,0.005036800106366476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,256,0.004789333542188009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,128,0.004342400034268697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,64,0.003990400085846583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,32,0.004033066580692927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,16384,0.05474880139032999
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,65536,0.20538026491800943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,12288,0.04198400179545085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,10240,0.035702399412790936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,8192,0.029423999786376952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,7168,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,5120,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,6144,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,4096,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,3584,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,3072,0.013416533668835958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,2560,0.01183146635691325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,2048,0.01030613382657369
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,1536,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,1024,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,512,0.005471999943256378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,768,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,256,0.00484799991051356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,128,0.0044725333650906885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,64,0.004141866664091746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,5120,32,0.004137599964936575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,16384,0.04348586797714234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,65536,0.15960639317830402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,12288,0.03317866722742717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,10240,0.0284661332766215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,8192,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,5120,0.015884799758593242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,6144,0.018117332458496095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,4096,0.013448533415794373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,3584,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,3072,0.011310933033625285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,2560,0.009955199559529622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,2048,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,1536,0.007157333195209503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,1024,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,512,0.005378133555253347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,768,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,256,0.004710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,128,0.004489600161711375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,64,0.004347733159859975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,4096,32,0.004297600189844767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,16384,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,65536,0.13984427452087403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,12288,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,10240,0.024167466163635253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,8192,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,7168,0.017593600352605186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,5120,0.0135861337184906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,6144,0.01548479994138082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,4096,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,3584,0.01058240036169688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,3072,0.010013866424560546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,2560,0.008794666330019633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,2048,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,1536,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,1024,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,512,0.004679466784000397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,768,0.004970666766166687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,256,0.004399999976158142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,128,0.004092800120512644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,64,0.004120533416668574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3584,32,0.004069333275159201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,16384,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,65536,0.1360223929087321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,12288,0.028604799509048463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,10240,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,8192,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,7168,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,5120,0.014281599720319112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,6144,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,4096,0.01225493351618449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,3584,0.011128532886505126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,3072,0.00997866690158844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,2560,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,2048,0.007931733131408691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,1536,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,1024,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,512,0.004753066599369049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,768,0.005015466610590617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,256,0.004275199770927429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,128,0.003975466638803482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,64,0.0036533333361148832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,3072,32,0.003576533248027166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,16384,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,65536,0.11216213703155517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,12288,0.02723840077718099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,10240,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,8192,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,7168,0.017318399747212727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,5120,0.013974400361378989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,6144,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,4096,0.010377599795659383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,3584,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,3072,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,2560,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,2048,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,1536,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,1024,0.0054400001962979635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,512,0.004779733220736186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,768,0.005017599960168203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,256,0.004329599936803182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,128,0.004071466624736786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,64,0.003764266769091288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2560,32,0.004029866556326548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,16384,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,65536,0.10124053160349529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,12288,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,10240,0.01813973387082418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,7168,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,8192,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,6144,0.0128330667813619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,5120,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,12288,7168,0.05451200008392334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,4096,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,3584,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,3072,0.00831573357184728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,2560,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,2048,0.006607999900976817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,1024,0.005096533397833506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,1536,0.005789866546789805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,512,0.00446720023949941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,256,0.003925333420435587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,768,0.004871466755867004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,128,0.0039818666875362395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,64,0.003960533440113068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,2048,32,0.003907199949026108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,16384,0.02505279978116353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,12288,0.020670932531356812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,10240,0.016577066977818807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,65536,0.07321600119272867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,8192,0.01418560047944387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,6144,0.011879466970761617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,7168,0.013090133666992188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,5120,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,4096,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,3584,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,3072,0.007157333195209503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,2560,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,2048,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,1024,0.004817066589991251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,768,0.004334933559099833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,1536,0.0054954667886098225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,512,0.00408746674656868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,256,0.003929600119590759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,128,0.00359253336985906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,64,0.003517866631348928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1536,32,0.0035360001027584078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,16384,0.019504000743230186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,12288,0.01657386620839437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,8192,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,65536,0.05584213336308798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,10240,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,5120,0.010013866424560546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,7168,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,6144,0.01090773344039917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,4096,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,3584,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,3072,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,2560,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,2048,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,1536,0.005382399757703145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,1024,0.004874666531880697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,768,0.004795733094215393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,256,0.003952000041802724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,512,0.004131199916203817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,128,0.003706666578849157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,64,0.0036458666125933326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,1024,32,0.003619199991226196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,16384,0.01602453291416168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,12288,0.013585066795349121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,65536,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,10240,0.013994666934013366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,7168,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,8192,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,6144,0.010833066701889039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,5120,0.009136000275611877
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,4096,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,3584,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,3072,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,2048,0.005782400071620941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,2560,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,1536,0.005003733436266581
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,1024,0.004735999802748362
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,768,0.004375466704368591
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,512,0.004012800008058548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,256,0.0037269333998362223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,128,0.00348693331082662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,64,0.003189333279927572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,768,32,0.003550933301448822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,12288,0.012469333410263062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,16384,0.014791466792424521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,10240,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,8192,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,65536,0.03317760030428569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,7168,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,6144,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,5120,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,4096,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,3584,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,3072,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,2560,0.006190933287143707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,2048,0.005414400001366933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,1536,0.005268266797065735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,1024,0.004770133395989736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,768,0.004407466451327006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,256,0.0036576000352700555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,512,0.004042666653792063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,128,0.0034634667138258614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,64,0.00360959991812706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,512,32,0.003521066655715307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,16384,0.012970667084058127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,12288,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,65536,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,10240,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,7168,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,8192,0.009054932991663616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,6144,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,5120,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,3584,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,4096,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,2560,0.005852800110975901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,2048,0.005526400109132131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,1536,0.004632533093293508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,1024,0.004407466451327006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,768,0.004138666639725367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,512,0.00391146664818128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,256,0.0035616000493367515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,64,0.003078400095303853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,128,0.003209600100914637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,256,32,0.0032266666491826378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,12288,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,16384,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,65536,0.019715199867884316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,10240,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,8192,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,6144,7168,0.029765333731969195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,6144,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,7168,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,5120,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,3584,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,4096,0.007589333256085714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,3072,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,1536,0.004780800143877665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,2560,0.005857066810131073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,2048,0.0056320001681645715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,1024,0.004366933306058248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,768,0.004095999896526337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,256,0.003533866753180822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,128,0.003209600100914637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,512,0.0036757332583268487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,64,0.0032287999987602235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,128,32,0.0032927999893824257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,16384,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,12288,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,10240,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,65536,0.014837333559989929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,7168,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,6144,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,8192,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,5120,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,4096,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,3584,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,3072,0.006265600025653839
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,2560,0.00664213349421819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,2048,0.00639573335647583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,1536,0.004833066463470459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,768,0.004037333279848098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,1024,0.004390400151411692
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,512,0.003980800012747447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,256,0.003602133442958196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,128,0.003160533308982849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,32,0.00315733328461647
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,64,64,0.0031008000175158186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,16384,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,12288,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,10240,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,65536,0.01693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,7168,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,8192,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,5120,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,6144,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,4096,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,3584,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,3072,0.00697920024394989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,2048,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,2560,0.006713599960009258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,1536,0.004710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,1024,0.004410666724046072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,768,0.004042666653792063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,256,0.003389866650104523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,512,0.003605333218971888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,128,0.003218133250872294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,64,0.003190399954716364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,384,32,32,0.0032437334458033243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,8192,0.21910187403361
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,10240,0.26289493242899575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,12288,0.36259838740030925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,16384,0.4885439872741699
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,5120,0.13728426297505697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,7168,0.18927040100097656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,6144,0.160698668162028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,4096,0.10876266956329346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,2560,0.06912000179290771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,3072,0.08416000207265219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,3584,0.09577813148498535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,2048,0.05789013306299845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,1536,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,768,0.023912533124287923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,1024,0.02997013330459595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,512,0.01794346570968628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,256,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,128,0.01179093321164449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,64,0.011282133062680562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,65536,32,0.012036266922950744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,12288,0.08304533163706461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,16384,0.1102463960647583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,10240,0.06881279945373535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,8192,0.05789013306299845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,7168,0.04918293158213298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,6144,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,5120,0.037138132254282634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,4096,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,65536,0.4030463854471843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,3584,0.027237333854039508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,3072,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,2048,0.01761386593182882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,2560,0.021277866760889688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,768,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,1024,0.01118293305238088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,1536,0.014357333381970724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,256,0.005806933343410492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,128,0.0054058666030565895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,64,0.005037866532802582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,16384,32,0.006676266590754191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,12288,0.05949333508809408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,16384,0.07782399654388428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,10240,0.050279466311136875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,8192,0.04177920023600261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,7168,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,6144,0.03181119958559672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,65536,0.28897279103597007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,5120,0.027576533953348796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,3072,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,3584,0.020125865936279297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,2560,0.015612799922625223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,2048,0.013229866822560629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,1536,0.011379200220108032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,768,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,1024,0.009410132964452107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,512,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,256,0.005543466905752818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,128,0.004995200037956238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,32,0.0046293333172798155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,12288,64,0.004744533201058706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,12288,0.05157653490702311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,16384,0.06756800015767415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,10240,0.043350398540496826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,7168,0.031198932727177935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,8192,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,65536,0.24664533933003746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,6144,0.027646932999293012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,5120,0.02389226754506429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,4096,0.019523199399312338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,3584,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,3072,0.015414399902025857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,2560,0.013699199755986533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,2048,0.011947733163833619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,1536,0.010012800494829815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,1024,0.008282666901747386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,768,0.006701866785685222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,512,0.005415466427803039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,256,0.004996266464392344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,64,0.0044159998496373495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,32,0.0045962666471799215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,10240,128,0.004746666550636292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,12288,0.043961600462595625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,16384,0.05700266758600871
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,10240,0.03734079996744792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,65536,0.2113866647084554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,8192,0.03126506606737773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,6144,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,5120,0.01945706605911255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,4096,0.0160970667997996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,3584,0.01452906628449758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,3072,0.013018666704495748
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,2560,0.011763200163841248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,1536,0.008990933497746784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,2048,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,1024,0.0066442668437957765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,768,0.005645866692066193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,512,0.005220266679922739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,256,0.004571733375390371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,128,0.004351999859015147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,32,0.004252799848715464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,64,0.004014933357636133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,16384,0.05208853483200073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,12288,0.03898239930470784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,65536,0.1865066687266032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,10240,0.03386346499125163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,8192,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,7168,0.024301866690317787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,6144,0.021502933899561563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,5120,0.017873066663742065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,4096,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,3584,0.013434666395187377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,2560,0.010796800255775452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,3072,0.012036266922950744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,2048,0.009613866607348125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,1536,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,1024,0.005924266576766968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,768,0.005106133222579956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,512,0.004744533201058706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,128,0.004469333092371622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,256,0.004430933296680451
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,64,0.003944533318281174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,7168,32,0.0042453333735466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,16384,0.04687146743138631
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,12288,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,65536,0.1719626744588216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,8192,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,7168,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,5120,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,6144,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,4096,0.014383999506632486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,3584,0.012955733140309653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,3072,0.01181013286113739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,2560,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,2048,0.009474133451779682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,1024,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,1536,0.007426133255163829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,768,0.005857066810131073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,512,0.005064533154169718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,256,0.004844800134499868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,128,0.004253866771856943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,64,0.003986133386691412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,6144,32,0.004419200122356415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,16384,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,12288,0.030242133140563964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,65536,0.1456160068511963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,10240,0.02566933234532674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,6144,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,7168,0.018911999464035035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,8192,0.02135466734568278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,5120,0.014179199934005737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,4096,0.012443733215332032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,3584,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,3072,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,2560,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,2048,0.008316799998283386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,1536,0.007114666700363159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,1024,0.005791999896367391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,512,0.004619733492533366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,768,0.0054954667886098225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,256,0.004358399907747904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,128,0.004380799829959869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,32,0.004042666653792063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,5120,64,0.003940266619126002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,16384,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,12288,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,65536,0.11335786978403728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,10240,0.022322134176890055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,8192,0.018145066499710084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,7168,0.016158933440844216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,6144,0.014595199624697366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,5120,0.012834133704503379
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,4096,0.011240532994270325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,3584,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,2560,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,3072,0.009683199723561605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,2048,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,1536,0.006291200220584869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,1024,0.005376000205675761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,512,0.004819199939568837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,256,0.004827733337879181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,128,0.003925333420435587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,32,0.004098133246103922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,64,0.003974399964014689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,16384,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,65536,0.10328746636708577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,12288,0.023347200949986775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,10240,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,8192,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,7168,0.014794666568438211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,5120,0.01165013313293457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,6144,0.013301333785057068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,4096,0.010214400291442872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,3584,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,3072,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,2560,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,2048,0.006942933301130931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,1024,0.004996266464392344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,1536,0.006198399762312571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,768,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,512,0.004459733267625173
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,256,0.0037632000943024955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,128,0.003673599908749262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,64,0.0036138666172822317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3584,32,0.003937066594759623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,65536,0.09410560131072998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,16384,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,12288,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,10240,0.018487467368443807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,8192,0.015545599659283958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,7168,0.014014933506647745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,6144,0.012812800208727517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,5120,0.011332266529401143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,4096,0.009966933727264404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,3072,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,3584,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,2560,0.0072170664866765336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,2048,0.006234666705131531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,1536,0.005847466488679251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,768,0.004619733492533366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,512,0.004177066683769226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,256,0.003803733239571253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,128,0.004019200056791306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,64,0.003623466690381368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,32,0.0037674665451049804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,65536,0.07533226807912191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,16384,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,12288,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,8192,0.015204266707102457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,7168,0.013771733641624451
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,6144,0.012407466769218445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,5120,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,4096,0.009583999713261921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,3584,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,3072,0.007909333209196727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,2560,0.007216000060240428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,2048,0.006187733511130015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,1536,0.005782400071620941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,1024,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,768,0.004588800172011057
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,512,0.004212266703446706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,256,0.0038912000755469004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,128,0.0036821333070596062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,64,0.00363520011305809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2560,32,0.0035232000052928926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,65536,0.06277226607004802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,16384,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,12288,0.02095680038134257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,10240,0.016569599509239197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,8192,0.01430400013923645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,7168,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,6144,0.011787733435630799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,5120,0.010615467031796774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,4096,0.009193600217501322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,3584,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,3072,0.007524266839027405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,2560,0.006667733192443848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,2048,0.005783466498057047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,1536,0.005407999952634176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,1024,0.004624000191688538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,768,0.0042453333735466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,512,0.003835733234882355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,256,0.003861333429813385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,128,0.003881600002447764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,64,0.0036170666416486105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,2048,32,0.0039381332695484165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,65536,0.04928853511810303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,16384,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,12288,0.017387733856836955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,10240,0.015613866845766702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,8192,0.01383786698182424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,7168,0.01252906620502472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,6144,0.0114464004834493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,5120,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,4096,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,3584,0.007968000074227651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,3072,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,2560,0.006600533425807953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,2048,0.005885866781075796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,1536,0.005373866856098175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,1024,0.00477866679430008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,768,0.004211199780305227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,512,0.004145066688458125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,256,0.003907199949026108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,128,0.003565866748491923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,64,0.003553066651026408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1536,32,0.003550933301448822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,65536,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,16384,0.015681067109107973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,12288,0.01397333343823751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,10240,0.01281599998474121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,8192,0.013620266318321228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,7168,0.011995733777681986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,6144,0.010822400450706482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,5120,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,8192,7168,0.027239465713500978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,4096,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,3584,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,3072,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,2048,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,1536,0.005299200117588043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,1024,0.004835199813048045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,768,0.004354133208592733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,512,0.003923200070858002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,256,0.003647999962170919
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,128,0.003491200009981791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,64,0.0032618666688601174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,1024,32,0.0032672000428040824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,16384,0.014792533715566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,65536,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,12288,0.012813867131868998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,10240,0.011822932958602905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,8192,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,7168,0.00981119970480601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,6144,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,5120,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,4096,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,3584,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,3072,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,2560,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,2048,0.0054400001962979635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,1536,0.005050666630268097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,1024,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,768,0.004386133452256521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,512,0.004025600105524063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,256,0.003748266647259394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,128,0.0035445332527160645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,64,0.003337600082159042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,768,32,0.003491200009981791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,16384,0.011958400408426922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,65536,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,12288,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,10240,0.012436266740163167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,8192,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,7168,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,6144,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,5120,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,4096,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,3584,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,3072,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,2048,0.005469866593678792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,1536,0.004957866668701172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,1024,0.004369066655635833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,768,0.00436160018046697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,512,0.003962666789690653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,256,0.003607466568549474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,128,0.003324799984693527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,64,0.003289599965016047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,512,32,0.0031295999884605407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,16384,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,65536,0.017113600174585977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,12288,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,10240,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,8192,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,7168,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,6144,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,5120,0.00830506682395935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,4096,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,3584,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,3072,0.006637866795063019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,2560,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,2048,0.005398400127887726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,1536,0.00508480022350947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,1024,0.004349866509437561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,768,0.004331733286380768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,512,0.003939199944337209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,256,0.0036298667391141256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,128,0.00325546662012736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,64,0.003201066702604294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,4096,768,0.004937600096066793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,256,32,0.003219199925661087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,12288,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,16384,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,65536,0.015681067109107973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,10240,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,8192,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,7168,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,6144,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,4096,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,5120,0.00824533353249232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,3584,0.007115733126799266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,3072,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,2560,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,2048,0.006295466423034668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,1536,0.004830933113892873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,1024,0.004324266811211904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,768,0.004014933357636133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,512,0.00365226666132609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,256,0.0035573333501815797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,128,0.003271466741959254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,64,0.003256533294916153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,128,32,0.0031776001056035364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,16384,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,12288,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,65536,0.014484266440073649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,10240,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,8192,0.007394133508205414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,7168,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,6144,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,5120,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,4096,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,3584,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,2560,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,2048,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,1536,0.004676266511281332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,1024,0.004354133208592733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,768,0.004062933226426443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,512,0.0035914666950702667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,256,0.0034122665723164878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,128,0.0032170665760835014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,32,0.003125333289305369
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,64,64,0.0031871999303499854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,16384,0.009195733070373534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,12288,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,65536,0.014249599973360696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,10240,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,8192,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,7168,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,6144,0.00694400022427241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,5120,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,4096,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,3584,0.006705066561698914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,3072,0.0065760001540184024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,2560,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,2048,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,1024,0.0044149334232012425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,1536,0.0045962666471799215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,768,0.003933866570393244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,512,0.0036288000643253326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,256,0.0034986667335033415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,128,0.0032245332996050516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,64,0.0032448001205921174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,32,32,0.003193599979082743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,256,3072,1024,0.004982399940490723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,10240,0.2353216012318929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,12288,0.3018069267272949
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,16384,0.4107263882954915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,8192,0.19034773508707684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,7168,0.16486399968465168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,6144,0.14349652926127116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,5120,0.11842453479766846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,4096,0.09765546321868897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,3584,0.08659626642862955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,3072,0.07429760297139486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,2560,0.06287360191345215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,2048,0.052292267481486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,1024,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,1536,0.039867734909057616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,768,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,256,0.014890666802724203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,128,0.011892267068227132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,64,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,512,0.016847999890645345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,65536,32,0.01267519990603129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,16384,0.10557440121968586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,12288,0.07618666489919027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,10240,0.06540053288141887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,8192,0.05512533187866211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,7168,0.04642133315404256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,6144,0.0408949335416158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,65536,0.3814741452534994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,5120,0.035225598017374675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,3584,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,4096,0.02908266584078471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,3072,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,2560,0.019846399625142418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,2048,0.016428800423940022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,1024,0.010739200313886007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,1536,0.013230933745702108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,768,0.009063466389973959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,512,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,256,0.005355733136336008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,64,0.00499839981396993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,128,0.004771199822425842
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,16384,32,0.005212800204753875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,16384,0.07479360103607177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,10240,0.048674134413401286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,12288,0.05577280124028524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,8192,0.040549333890279135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,7168,0.034746666749318436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,65536,0.27921066284179685
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,6144,0.031060266494750976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,4096,0.02223466634750366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,3584,0.01972800095876058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,3072,0.017258665959040322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,2048,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,2560,0.01527253290017446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,1536,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,768,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,1024,0.008724266290664673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,512,0.005627733469009399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,256,0.005051733553409576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,128,0.004428799947102865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,32,0.004433066646258036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,12288,64,0.004409599800904592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,12288,0.05628586610158285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,16384,0.08123733202616373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,10240,0.051780267556508386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,8192,0.0395957350730896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,7168,0.036183468500773114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,65536,0.3028319994608561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,6144,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,4096,0.0234826664129893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,5120,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,3584,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,3072,0.01848533352216085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,2560,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,2048,0.013290666540463767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,1536,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,768,0.0066655998428662615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,512,0.005883733431498209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,256,0.005073066552480062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,128,0.004817066589991251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,32,0.004362666606903076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,10240,64,0.004374399781227112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,16384,0.05358933210372925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,12288,0.03993599812189738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,10240,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,65536,0.19425279299418133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,8192,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,7168,0.025260800123214723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,6144,0.022312533855438233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,5120,0.019320533672968546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,4096,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,3584,0.01444906691710154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,2560,0.011556266744931539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,3072,0.012820266683896384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,2048,0.010389332969983418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,1536,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,1024,0.006883200009663899
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,512,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,256,0.0043818667531013485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,768,0.0055637334783871974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,64,0.004496000210444133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,128,0.004253866771856943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,8192,32,0.004458666841189066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,10240,0.03283413251241048
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,12288,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,16384,0.04993600050608317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,65536,0.17667412757873535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,6144,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,8192,0.0271509329477946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,7168,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,4096,0.015403733650843302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,3584,0.013698133826255798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,3072,0.012409599622090657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,5120,0.018077866236368815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,2560,0.011310933033625285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,2048,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,1536,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,1024,0.007156266768773396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,768,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,512,0.0054058666030565895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,256,0.004428799947102865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,128,0.004062933226426443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,64,0.003982933362325033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,7168,32,0.0039989332358042395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,12288,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,10240,0.03221866687138875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,16384,0.04857279856999715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,65536,0.18042880694071453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,8192,0.02696640094121297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,7168,0.023600000143051147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,6144,0.020946133136749267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,5120,0.01775040030479431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,4096,0.01486186683177948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,3584,0.013635200262069703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,2560,0.01071573297182719
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,3072,0.012013866504033407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,2048,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,1536,0.00786240001519521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,1024,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,512,0.004743466774622599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,256,0.004369066655635833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,768,0.005633066594600678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,128,0.004211199780305227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,64,0.0036778666079044344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,6144,32,0.003804799914360046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,12288,0.0355679988861084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,16384,0.04573866526285807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,10240,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,65536,0.14793386459350585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,8192,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,6144,0.019827200969060262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,7168,0.022259199619293214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,4096,0.014314666390419006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,5120,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,3584,0.013155200084050498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,3072,0.011659733454386393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,2560,0.010357333223025005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,1536,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,1024,0.005449600021044413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,2048,0.009134933352470398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,768,0.005339733262856802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,512,0.005193600058555603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,256,0.004322133461634318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,128,0.00403413325548172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,64,0.0037237333754698435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,5120,32,0.004035199930270513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,10240,0.024621866146723428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,16384,0.037752532958984376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,65536,0.11154452959696452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,7168,0.018201599518458046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,6144,0.016574933131535848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,5120,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,4096,0.011990400155385335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,3584,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,2560,0.007768533130486806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,3072,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,2048,0.007114666700363159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,1536,0.005700266857941946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,1024,0.004836266736189524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,768,0.004457599918047587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,512,0.004411733150482178
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,256,0.004070399949947992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,128,0.004009599983692169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,32,0.0037685332198937735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,4096,64,0.0036906667053699495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,16384,0.040003200372060135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,65536,0.13752320607503254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,10240,0.025521065791447955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,8192,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,7168,0.01909546653429667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,6144,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,5120,0.01483519971370697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,4096,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,3584,0.012061867117881774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,3072,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,1536,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,2048,0.006637866795063019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,2560,0.0074986666440963745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,1024,0.004841599861780802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,768,0.005029333134492239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,512,0.004369066655635833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,128,0.003977599988381068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,256,0.004056533426046371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,64,0.0035861333211263022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3584,32,0.0038986665507157645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,16384,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,12288,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,10240,0.017805866400400796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,65536,0.09376426537831625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,7168,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,6144,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,8192,0.014935466647148132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,5120,0.011240532994270325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,4096,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,3584,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,2560,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,3072,0.008281599978605907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,2048,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,1024,0.004880000154177348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,1536,0.005381333331267038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,768,0.00458133320013682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,512,0.004145066688458125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,256,0.00395413339138031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,128,0.00360959991812706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,32,0.0035818666219711304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,3072,64,0.003589333345492681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,16384,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,12288,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,65536,0.09437867005666098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,10240,0.016847999890645345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,8192,0.014564266800880432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,7168,0.013220266501108805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,6144,0.012301866213480632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,5120,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,4096,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,3584,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,3072,0.008274133503437042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,2048,0.006612266600131989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,2560,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,1536,0.005851733187834421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,1024,0.005320533116658529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,768,0.004858666658401489
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,256,0.00395413339138031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,512,0.004524800181388855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,128,0.003978666663169861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,64,0.003519999980926514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2560,32,0.0035349334279696143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,16384,0.02305493354797363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,10240,0.01725333333015442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,12288,0.018966400623321535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,65536,0.06567146778106689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,8192,0.014450132846832275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,7168,0.012949333588282267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,6144,0.011557333668073018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,4096,0.00902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,5120,0.010326400399208069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,3584,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,3072,0.007495466868082683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,2560,0.006258133550484974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,1536,0.005032533407211303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,2048,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,1024,0.004725333551565806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,768,0.004491733511288961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,512,0.00407679999868075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,128,0.003642666588226954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,256,0.004339199761549632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,64,0.003626666714747747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,2048,32,0.0035914666950702667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,12288,0.016294399897257485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,10240,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,16384,0.01800640026728312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,65536,0.05184746583302816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,8192,0.014108799894650779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,7168,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,6144,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,5120,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,4096,0.008682666222254436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,3584,0.00783253312110901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,2560,0.006232533355553945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,3072,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,1536,0.005066666503747304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,2048,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,1024,0.004779733220736186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,768,0.004343466460704803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,512,0.0040618665516376495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,256,0.003656533360481262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,128,0.003555200000603994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,32,0.003601066768169403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1536,64,0.0033514666060606635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,65536,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,16384,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,12288,0.013152000308036805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,10240,0.01234346628189087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,6144,0.011059199770291645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,8192,0.011150933305422465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,7168,0.010310399532318115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,5120,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,3584,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,3072,0.006677333513895671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,2048,0.005510400235652924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,2560,0.006201600035031637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,1536,0.004970666766166687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,1024,0.00484799991051356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,512,0.003984000037113826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,768,0.004392533500989278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,256,0.0036757332583268487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,128,0.003525333354870478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,64,0.003219199925661087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,32,0.0035584000249703727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,12288,0.014451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,16384,0.01691626707712809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,65536,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,10240,0.01276693344116211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,7168,0.010739200313886007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,8192,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,6144,0.009810133775075277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,5120,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,4096,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,3584,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,2560,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,2048,0.005782400071620941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,1536,0.005017599960168203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,768,0.004330666859944662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,1024,0.004448000093301137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,512,0.003939199944337209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,256,0.0036415999134381616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,64,0.003234133372704188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,128,0.0032298666735490165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,768,32,0.003205333401759466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,12288,0.011177600423494975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,16384,0.013506133357683817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,65536,0.02409706711769104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,10240,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,7168,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,8192,0.009408000111579894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,6144,0.008237866560618083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,5120,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,4096,0.007874133189519246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,3584,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,2560,0.005849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,2048,0.005438933273156484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,1536,0.004660266637802124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,768,0.004073599974314371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,1024,0.004349866509437561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,512,0.003947733342647553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,256,0.0036576000352700555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,64,0.0032416000962257386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,128,0.0032437334458033243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,512,32,0.003319466610749563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,16384,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,12288,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,65536,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,8192,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,10240,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,7168,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,6144,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,4096,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,5120,0.008317866424719492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,3584,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,3072,0.007084799806276958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,2560,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,2048,0.00537066658337911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,1536,0.004877866804599762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,768,0.004106666644414266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,1024,0.0044149334232012425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,512,0.0036938667297363283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,256,0.0035957333942254386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,128,0.0032149332265059153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,64,0.0031957333286603295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,256,32,0.0031925333042939507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,16384,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,12288,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,65536,0.015448533495267234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,10240,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,8192,0.008683733145395915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,7168,0.008282666901747386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,6144,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,5120,0.007386666536331177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,3584,0.006677333513895671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,3072,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,2560,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,2048,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,1024,0.004337066908677419
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,1536,0.0045621335506439206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,768,0.004006399959325791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,512,0.0036906667053699495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,256,0.0037077332536379496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,128,0.003221333275238673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,64,0.003151999910672506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,32,0.0032106667757034303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,16384,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,65536,0.014042666554450989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,12288,0.00804373323917389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,10240,0.007795199751853943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,8192,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,7168,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,6144,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,5120,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,4096,0.006232533355553945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,3584,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,2560,0.006738133231798808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,2048,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,1536,0.0045621335506439206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,1024,0.004364799956480662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,768,0.003944533318281174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,512,0.0037130666275819145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,256,0.00347626656293869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,128,0.003223466624816259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,64,0.003138133386770884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,64,32,0.0031530665854612983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,65536,0.013639466961224875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,16384,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,10240,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,12288,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,8192,0.007214933137098948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,7168,0.006612266600131989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,6144,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,5120,0.0065760001540184024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,4096,0.006292266647020976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,3584,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,3072,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,2560,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,2048,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,1536,0.0046634669105211895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,1024,0.004379733403523763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,768,0.003992533435424169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,512,0.0036629334092140196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,256,0.003533866753180822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,128,0.003293866664171219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,64,0.003094399968783061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,32,32,0.003070933371782303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,16384,0.3679231961568197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,12288,0.26719786326090494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,8192,0.1945258617401123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,10240,0.2379093329111735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,6144,0.14704640706380206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,7168,0.16609279314676922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,4096,0.09840640226999918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,5120,0.12148053646087646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,3072,0.07461653550465902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,3584,0.08663040002187093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,2048,0.05290453433990479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,2560,0.06376106739044189
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,1536,0.040141868591308597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,1024,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,768,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,512,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,256,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,128,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,64,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,65536,32,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,16384,0.10352533658345539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,12288,0.07618559996287028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,65536,0.3728384017944336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,10240,0.06533120075861612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,8192,0.054135465621948244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,7168,0.045875199635823566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,6144,0.040072532494862874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,5120,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,4096,0.028668800989786785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,3584,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,2560,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,2048,0.01608746647834778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,1536,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,1024,0.010358400146166484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,512,0.0067007998625437425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,256,0.004970666766166687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,128,0.00472320020198822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,64,0.004271999994913737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,16384,32,0.004523733258247375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,16384,0.07485546271006266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,65536,0.2736799875895182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,12288,0.0556714653968811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,8192,0.03973120053609212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,10240,0.04836693207422892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,7168,0.03420159816741943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,6144,0.031061333417892457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,5120,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,4096,0.022051199277242025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,3584,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,3072,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,2560,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,2048,0.013502933581670127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,1536,0.010833066701889039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,768,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,512,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,256,0.004785066843032837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,128,0.004334933559099833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,64,0.004419200122356415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,12288,32,0.0045621335506439206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,16384,0.06655999819437662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,12288,0.05027733246485392
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,65536,0.2402986685434977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,10240,0.04348586797714234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,8192,0.03679253260294597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,7168,0.031196800867716472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,6144,0.02805759906768799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,5120,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,4096,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,3072,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,3584,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,2560,0.014106667041778565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,2048,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,1536,0.010423466563224792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,768,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,512,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,256,0.004923733572165171
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,128,0.0046634669105211895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,64,0.004356266558170318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,10240,32,0.004164266586303711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,16384,0.05003946622212728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,65536,0.17919999758402508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,12288,0.037750399112701415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,10240,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,8192,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,7168,0.024029866854349772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,6144,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,5120,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,4096,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,3584,0.013906133174896241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,3072,0.012341333429018657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,2560,0.01130986710389455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,2048,0.009920000036557516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,1536,0.008478933572769165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,1024,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,768,0.0054400001962979635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,512,0.004558933277924856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,256,0.004363733530044556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,128,0.003924266745646795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,64,0.0036629334092140196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,8192,32,0.003822933385769526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,16384,0.04655786752700806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,65536,0.16629865964253743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,12288,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,10240,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,8192,0.025598933299382527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,7168,0.02232426603635152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,5120,0.01723840037981669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,1024,4096,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,4096,0.014245333274205527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,3584,0.013255467017491659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,3072,0.012060800194740295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,2560,0.010762666662534077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,2048,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,1536,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,1024,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,768,0.0061930666367212926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,512,0.0054400001962979635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,256,0.004278400043646494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,128,0.003999999910593033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,64,0.003921066721280416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,32,0.003947733342647553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,16384,0.04840213457743327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,65536,0.1539413293202718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,12288,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,10240,0.031947733958562215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,8192,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,7168,0.02341866691907247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,6144,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,5120,0.017658666769663493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,4096,0.014792533715566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,3584,0.013427199920018515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,3072,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,2560,0.010822400450706482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,1536,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,2048,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,1024,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,768,0.005738666653633118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,512,0.00499839981396993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,256,0.004335999985535939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,128,0.003924266745646795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,64,0.003958400090535482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,6144,32,0.003924266745646795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,16384,0.0459445317586263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,65536,0.1409023920694987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,12288,0.035499731699625656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,10240,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,8192,0.02532800038655599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,7168,0.02225386699040731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,6144,0.019593600432078043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,5120,0.01684160033861796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,4096,0.014385066429773965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,3584,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,3072,0.01171946624914805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,2560,0.010424533486366272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,2048,0.009101866682370504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,1536,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,1024,0.005780266722043356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,768,0.0055978665749231975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,512,0.005031466484069824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,256,0.004350933432579041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,128,0.0040501333773136135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,64,0.003970133264859518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,5120,32,0.003659733384847641
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,16384,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,65536,0.10069440205891926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,192,128,4096,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,12288,0.02744320034980774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,10240,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,7168,0.01486186683177948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,8192,0.016711467504501344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,6144,0.01362986663977305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,5120,0.011587199568748475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,4096,0.010294399658838908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,3584,0.009604266285896302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,3072,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,2048,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,2560,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,1536,0.006161066889762879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,1024,0.00491839994986852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,512,0.004331733286380768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,768,0.004507733384768168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,256,0.003960533440113068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,128,0.0036789332826932275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,64,0.0035391998787721
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,4096,32,0.0036618667344252265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,12288,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,16384,0.030446932713190718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,65536,0.09263786474863688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,10240,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,7168,0.014385066429773965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,8192,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,6144,0.01325440009435018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,5120,0.011689600348472596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,4096,0.011934933066368104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,3584,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,3072,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,2560,0.007398400207360585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,2048,0.006499200065930684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,1536,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,768,0.004433066646258036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,512,0.003940266619126002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,1024,0.004710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,256,0.004025600105524063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,128,0.0036085332433382668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,64,0.0035616000493367515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3584,32,0.0036960000793139136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,16384,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,12288,0.021757866938908896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,65536,0.07509333292643229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,7168,0.01636373301347097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,8192,0.017784533898035686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,10240,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,5120,0.012560000022252401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,6144,0.014791466792424521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,4096,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,3072,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,3584,0.009943466385205586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,2560,0.007905066510041555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,2048,0.0066655998428662615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,1536,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,1024,0.00521919975678126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,768,0.004621866842110952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,512,0.004382933179537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,128,0.0036799999574820197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,64,0.003470933437347412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,256,0.003966933240493139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,3072,32,0.0033941333492596946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,16384,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,12288,0.020068265994389854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,65536,0.06744960149129232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,8192,0.015955199797948204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,7168,0.014281599720319112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,10240,0.017869865894317626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,6144,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,5120,0.011480533083279927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,4096,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,3584,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,3072,0.00837546686331431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,2560,0.007425066828727722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,2048,0.007115733126799266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,1536,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,1024,0.005120000243186951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,768,0.004654933512210846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,512,0.004419200122356415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,128,0.003905066599448522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,64,0.0035146666069825493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,256,0.003946666667858759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2560,32,0.003589333345492681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,16384,0.01923840045928955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,12288,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,65536,0.056049064795176184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,8192,0.014451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,7168,0.013666133085886637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,10240,0.015754666924476624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,6144,0.011618133385976155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,5120,0.010309333602587383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,4096,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,3584,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,3072,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,2560,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,2048,0.005849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,1536,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,768,0.004377600053946177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,512,0.003995733211437861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,1024,0.004763733347256978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,256,0.004040533304214477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,128,0.00363520011305809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,64,0.003193599979082743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,2048,32,0.0035584000249703727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,16384,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,65536,0.043622398376464845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,12288,0.01546239952246348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,7168,0.012571733196576437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,8192,0.014859732985496522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,10240,0.014424533645311991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,6144,0.011332266529401143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,5120,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,4096,0.008691199620564779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,3584,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,3072,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,2560,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,2048,0.00581333339214325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,1536,0.005178666611512502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,768,0.004347733159859975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,512,0.004060799876848856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,1024,0.004833066463470459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,256,0.004082133372624716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,128,0.0035317334036032355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,64,0.0032245332996050516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1536,32,0.0035402665535608927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,65536,0.031949865818023684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,12288,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,16384,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,8192,0.011723732948303223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,10240,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,7168,0.011128532886505126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,6144,0.010513066252072652
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,5120,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,4096,0.011526399850845337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,3584,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,3072,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,2048,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,2560,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,1536,0.005049600203831991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,1024,0.004642133414745331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,512,0.0040618665516376495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,768,0.004357333481311798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,256,0.003714133302370707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,128,0.003570133447647095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,64,0.003551999976237615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,1024,32,0.0036544000109036768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,65536,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,12288,0.014485333363215128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,16384,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,8192,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,10240,0.01317759950955709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,7168,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,6144,0.010011733571688334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,5120,0.009057066837946574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,4096,0.008281599978605907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,3584,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,3072,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,2048,0.005475200215975444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,1536,0.005085866649945577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,2560,0.005857066810131073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,1024,0.00443200021982193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,768,0.004402133325735727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,512,0.004035199930270513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,256,0.0036447999378045404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,128,0.0034986667335033415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,64,0.0031178665657838186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,768,32,0.003206400076548258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,65536,0.02066453297932943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,12288,0.01158186693986257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,16384,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,10240,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,8192,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,7168,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,5120,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,6144,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,4096,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,3584,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,3072,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,2048,0.005407999952634176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,1536,0.004894933104515076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,2560,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,1024,0.004421333471934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,768,0.0040853333969910945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,512,0.003920000046491623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,256,0.00359253336985906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,128,0.0035455999275048576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,32,0.0031839999059836066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,512,64,0.0031925333042939507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,65536,0.019364267587661743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,16384,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,12288,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,10240,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,8192,0.012812800208727517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,7168,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,6144,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,5120,0.008237866560618083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,3584,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,3072,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,4096,0.007566933333873749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,2048,0.005373866856098175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,2560,0.00588266650835673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,1536,0.00462719996770223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,1024,0.004345599810282389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,768,0.0040554667512575785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,512,0.0037109332780043284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,256,0.003602133442958196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,128,0.0031637333333492277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,32,0.003256533294916153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,256,64,0.0031776001056035364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,65536,0.015237333377202353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,16384,0.009810133775075277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,12288,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,10240,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,8192,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,7168,0.008215466638406117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,6144,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,5120,0.00745066652695338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,3584,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,3072,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,4096,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,2560,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,2048,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,1536,0.0048981333772341405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,1024,0.0044266665975252785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,768,0.003931733220815659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,512,0.003705599904060364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,256,0.0035487999518712364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,128,0.0032501332461833954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,32,0.003188266605138779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,128,64,0.003115733216206233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,65536,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,16384,0.009125333031018574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,12288,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,10240,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,8192,0.007456000149250031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,6144,0.006667733192443848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,7168,0.007021866738796234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,5120,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,4096,0.0062613333264986675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,3584,0.006677333513895671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,3072,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,2560,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,1536,0.00483840008576711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,2048,0.006337066491444905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,1024,0.004340266684691111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,768,0.004072533299525579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,256,0.0034847999612490333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,512,0.0037077332536379496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,128,0.0033290666838486993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,64,0.00311253344019254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,64,32,0.003160533308982849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,16384,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,65536,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,12288,0.007494399944941203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,10240,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,8192,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,7168,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,6144,0.006629333396752675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,5120,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,3584,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,3072,0.00643093337615331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,4096,0.006201600035031637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,2048,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,1536,0.004799999793370565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,1024,0.004312533140182495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,768,0.003990400085846583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,7168,6144,0.020139733950297035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,512,0.003659733384847641
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,256,0.003522133330504099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,128,0.00329066663980484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,64,0.003310933212439219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,160,32,32,0.002974933385848999
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,12288,0.2754570643107096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,10240,0.2379744052886963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,8192,0.197324800491333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,16384,0.37888212203979493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,4096,0.09830400149027506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,6144,0.14984532992045085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,7168,0.16561493873596192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,5120,0.12148266633351643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,3584,0.08611839612325033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,2560,0.06445759932200114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,3072,0.07549973328908285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,2048,0.05410133202870687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,1536,0.04041386842727661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,1024,0.028124799331029255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,768,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,512,0.016100266575813295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,128,0.007507200042406718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,256,0.01076586643854777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,64,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,65536,32,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,12288,0.0637941320737203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,16384,0.09147733052571615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,10240,0.05457813342412313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,8192,0.044715734322865804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,7168,0.03932160139083862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,6144,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,65536,0.3224917411804199
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,4096,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,5120,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,3072,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,2048,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,3584,0.022529067595799764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,1536,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,1024,0.009080533186594646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,768,0.007904000083605449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,512,0.005747200051943461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,256,0.004676266511281332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,128,0.004389333228270212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,64,0.004358399907747904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,32,0.004513066510359446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,16384,0.06734506289164224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,12288,0.04922026793162028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,10240,0.04184746742248535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,8192,0.034746666749318436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,65536,0.23729492823282877
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,7168,0.030923734108606975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,6144,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,5120,0.024099200963974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,4096,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,3584,0.017667200167973837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,3072,0.015550933281580605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,2560,0.01362986663977305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,2048,0.011797333757082622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,1024,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,768,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,512,0.005766400198141734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,256,0.00452693353096644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,128,0.004387199878692627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,64,0.0040522667268912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,12288,32,0.004489600161711375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,16384,0.05604693492253622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,12288,0.04150613149007161
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,8192,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,65536,0.19787200291951496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,10240,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,5120,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,7168,0.026140799125035603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,6144,0.023755733172098795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,4096,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,3584,0.015075199802716575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,3072,0.013194666306177775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,2560,0.011989333232243856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,2048,0.01046506663163503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,1536,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,1024,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,768,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,256,0.004507733384768168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,512,0.004741333425045013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,128,0.004105599969625473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,64,0.0039007999002933502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,10240,32,0.004252799848715464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,16384,0.04656853278477986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,65536,0.18657280604044596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,12288,0.03420159816741943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,10240,0.0301749328772227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,8192,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,7168,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,6144,0.01991466681162516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,5120,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,4096,0.013979732990264893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,3584,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,3072,0.011592533191045125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,2048,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,2560,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,1536,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,1024,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,768,0.005415466427803039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,512,0.004530133306980133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,256,0.004418133199214936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,64,0.0038954667747020722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,128,0.004056533426046371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,8192,32,0.004029866556326548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,12288,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,16384,0.04246400197347005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,65536,0.16486399968465168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,10240,0.027127466599146527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,8192,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,6144,0.017591466506322227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,7168,0.01972800095876058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,5120,0.015209600329399109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,4096,0.012845866878827415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,3584,0.011590400338172912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,3072,0.010637866457303365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,2560,0.009693866968154908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,2048,0.008453333377838134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,1024,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,768,0.0045621335506439206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,1536,0.007051733136177063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,512,0.004517333209514618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,256,0.004020266731580098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,128,0.0036906667053699495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,64,0.0036608000596364343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,7168,32,0.00388373335202535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,16384,0.037546666463216145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,65536,0.14670507113138836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,10240,0.02525866627693176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,8192,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,6144,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,5120,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,7168,0.017873066663742065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,4096,0.011923199892044068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,3584,0.01090773344039917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,3072,0.010160000125567118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,2560,0.009194667140642803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,2048,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,1536,0.0064735998709996535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,1024,0.005120000243186951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,768,0.0047647997736930845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,256,0.004092800120512644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,512,0.004398933549722036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,128,0.0038975998759269714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,64,0.0036757332583268487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,6144,32,0.003992533435424169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,16384,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,65536,0.1154741366704305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,12288,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,10240,0.022731733322143555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,8192,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,7168,0.01650879979133606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,6144,0.014859732985496522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,5120,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,4096,0.011060266693433126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,3584,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,3072,0.009270399808883667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,2048,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,2560,0.008520533641179402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,1536,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,1024,0.005248000224431356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,512,0.004362666606903076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,768,0.004819199939568837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,256,0.004029866556326548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,128,0.003966933240493139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,64,0.0035743998984495797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,5120,32,0.0036288000643253326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,12288,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,16384,0.031674667199452715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,65536,0.10007893244425456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,10240,0.01950506567955017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,7168,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,8192,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,6144,0.013118933637936911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,5120,0.011559466520945232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,4096,0.009955199559529622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,3584,0.00940053363641103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,3072,0.008316799998283386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,2048,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,2560,0.007460266848405202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,1536,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,1024,0.004884266853332519
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,768,0.0043712000052134195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,512,0.004026666780312856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,256,0.003976533313592275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,128,0.004001066585381826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,64,0.0037632000943024955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,4096,32,0.003997866561015447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,16384,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,12288,0.022233599424362184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,65536,0.08946346441904704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,10240,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,8192,0.015474133690198264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,5120,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,6144,0.012410666545232136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,7168,0.013780267039934794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,4096,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,3584,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,3072,0.007974400122960409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,2560,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,2048,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,1536,0.005449600021044413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,1024,0.004858666658401489
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,768,0.004443733394145966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,256,0.003915733347336451
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,512,0.004033066580692927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,128,0.00367253323396047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,64,0.0035936000446478524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3584,32,0.004133333265781402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,16384,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,65536,0.0734549363454183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,12288,0.020603734254837035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,10240,0.018413867553075156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,8192,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,7168,0.01322879989941915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,6144,0.012267733613650005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,5120,0.010807466506958009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,3584,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,4096,0.009342933694521587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,3072,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,2560,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,1536,0.005379199981689453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,2048,0.006164266665776571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,1024,0.004826666911443075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,768,0.0046069333950678505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,512,0.004350933432579041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,256,0.004084266722202301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,128,0.003929600119590759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,64,0.0036149332920710243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,3072,32,0.0038794666528701783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,12288,0.018959999084472656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,65536,0.06533120075861612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,16384,0.02196906606356303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,10240,0.01725013256072998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,8192,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,7168,0.014016000429789224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,6144,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,5120,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,4096,0.00906986693541209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,3584,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,3072,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,2048,0.005849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,2560,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,1536,0.005378133555253347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,1024,0.004782933493455251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,512,0.003977599988381068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,768,0.004494933287302653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,256,0.004042666653792063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,128,0.003605333218971888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,64,0.0036138666172822317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2560,32,0.0036789332826932275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,12288,0.015204266707102457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,65536,0.057633066177368165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,16384,0.018209065993626913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,10240,0.01492586632569631
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,8192,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,7168,0.012755200266838074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,6144,0.01160533328851064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,5120,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,4096,0.00862506628036499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,3584,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,3072,0.00664106657107671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,2560,0.006165333092212677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,2048,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,1536,0.005039999882380167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,768,0.00439680020014445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,1024,0.004773333172003428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,512,0.003933866570393244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,256,0.0036661334335803984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,64,0.003159466634194056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,128,0.003502933432658514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,2048,32,0.0032661333680152893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,16384,0.015688533584276833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,12288,0.01356160044670105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,65536,0.04321066538492839
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,8192,0.011585066715876263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,7168,0.010804266730944315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,10240,0.0127893328666687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,6144,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,5120,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,4096,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,3584,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,3072,0.006640000144640605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,2560,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,2048,0.005508266886075338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,1536,0.004970666766166687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,768,0.004435199995835622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,1024,0.004755199948946635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,512,0.004011733333269755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,256,0.0037151999771595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,64,0.003349333256483078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,128,0.003522133330504099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1536,32,0.00352960005402565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,16384,0.012583466370900473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,12288,0.014519466956456503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,65536,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,8192,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,7168,0.010327466328938802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,10240,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,6144,0.009911466638247173
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,5120,0.008660266796747845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,4096,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,3584,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,3072,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,2560,0.0058559998869895935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,2048,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,1536,0.004971733192602793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,768,0.004346666733423868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,1024,0.0045045331120491024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,512,0.003990400085846583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,256,0.0036170666416486105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,64,0.0032511999209721885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,128,0.0035455999275048576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,1024,32,0.0032416000962257386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,16384,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,12288,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,65536,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,8192,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,7168,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,10240,0.010294399658838908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,6144,0.00851200024286906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,5120,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,4096,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,3584,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,2560,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,2048,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,1536,0.0049450665712356566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,768,0.004116266717513402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,1024,0.004435199995835622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,512,0.003944533318281174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,256,0.003668266783157984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,64,0.0032469332218170166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,128,0.0030400000512599947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,768,32,0.0032757334411144257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,16384,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,65536,0.018634666999181114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,12288,0.009551999966303508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,7168,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,8192,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,10240,0.009546666344006857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,6144,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,5120,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,4096,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,3584,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,3072,0.0065760001540184024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,2560,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,2048,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,1536,0.004935466746489207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,768,0.004278400043646494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,1024,0.0043488000830014546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,512,0.003668266783157984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,256,0.00365226666132609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,64,0.0032746667663256326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,128,0.0032373333970705668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,512,32,0.0032511999209721885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,16384,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,65536,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,12288,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,8192,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,7168,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,10240,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,16384,2560,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,6144,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,5120,0.008273066580295562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,3584,0.007387733459472657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,4096,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,2560,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,3072,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,2048,0.006347733239332835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,1536,0.004954666892687479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,1024,0.004469333092371622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,768,0.004119466741879781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,512,0.003697066754102707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,128,0.0032650666932264962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,256,0.0035861333211263022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,32,0.003206400076548258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,256,64,0.0031871999303499854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,12288,0.00851093331972758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,10240,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,16384,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,65536,0.015307733416557312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,8192,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,7168,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,5120,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,6144,0.006676266590754191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,4096,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,3584,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,3072,0.006724266707897187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,2560,0.006679466863473256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,2048,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,1536,0.004729599754015604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,1024,0.004456533491611481
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,512,0.003701333453257879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,768,0.004005333284536997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,256,0.0033183999359607695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,128,0.0033173332611719764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,64,0.003147733211517334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,16384,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,128,32,0.003102933367093404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,65536,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,12288,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,10240,0.007521066566308339
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,8192,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,7168,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,6144,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,5120,0.006894933183987935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,3072,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,3584,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,4096,0.00624533345301946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,2560,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,2048,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,1536,0.00472320020198822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,1024,0.004166399935881296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,768,0.004035199930270513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,512,0.0037216000258922578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,256,0.003257599969704946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,64,0.0032159999012947083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,128,0.00314026673634847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,64,32,0.0031199999153614043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,16384,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,65536,0.013230933745702108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,10240,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,12288,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,8192,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,7168,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,6144,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,5120,0.006299733122189839
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,4096,0.0065194666385650635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,3584,0.006198399762312571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,3072,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,2048,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,2560,0.006266666452089946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,1024,0.003997866561015447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,1536,0.004738133152325948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,768,0.0039989332358042395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,256,0.003222399950027466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,128,0.0031968000034491217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,512,0.0035455999275048576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,64,0.0032298666735490165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,128,32,32,0.0031797334551811217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,8192,0.17380693753560383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,12288,0.2733386675516764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,16384,0.37872212727864585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,10240,0.20777066548665366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,4096,0.08956586519877116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,5120,0.10795733133951824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,7168,0.1460693359375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,6144,0.13148159980773927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,2560,0.05792426665623983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,3584,0.07799466451009116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,3072,0.06785600185394287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,2048,0.048843733469645184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,1024,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,768,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,1536,0.03713599840799968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,512,0.014812800288200378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,256,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,64,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,65536,32,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,12288,0.06512639919916788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,16384,0.08925759792327881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,10240,0.055638400713602695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,8192,0.04676266511281331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,7168,0.03993493318557739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,6144,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,65536,0.33071893056233725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,4096,0.0256661335627238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,5120,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,3072,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,2560,0.017249067624409996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,2048,0.013983999689420065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,3584,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,1024,0.008854400118192036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,1536,0.011481600006421407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,768,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,512,0.005415466427803039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,256,0.0044490665197372435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,128,0.004333866635958353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,64,0.0039893334110577905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,16384,32,0.004012800008058548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,16384,0.07372799714406332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,12288,0.05485226710637411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,10240,0.04706986745198567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,8192,0.03822933435440064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,7168,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,65536,0.2657621383666992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,6144,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,5120,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,4096,0.021375999848047892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,3584,0.018979199727376304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,2560,0.014754133423169455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,3072,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,2048,0.012757333119710288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,1536,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,1024,0.008543999989827473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,512,0.005381333331267038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,256,0.004929066697756449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,768,0.0066453332702318835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,128,0.004485333462556204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,32,0.004182399809360504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,16384,0.059938132762908936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,12288,0.04293973445892334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,65536,0.21562026341756185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,8192,0.030514132976531983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,10240,0.03805013497670491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,6144,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,5120,0.02116159995396932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,7168,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,4096,0.01725226640701294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,3584,0.015748266379038492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,3072,0.014834133783976236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,2560,0.012231466174125672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,2048,0.01074133316675822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,1536,0.009473066528638203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,1024,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,768,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,256,0.004605866471926371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,128,0.004081066697835922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,512,0.005348266661167144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,64,0.003969066590070724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,10240,32,0.004147200038035711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,16384,0.04952746629714966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,12288,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,65536,0.17769813537597656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,8192,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,10240,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,7168,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,5120,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,6144,0.020890667041142782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,3584,0.013289599617322286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,3072,0.012026666601498922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,4096,0.014668800433476768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,2560,0.010797866185506185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,2048,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,1536,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,1024,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,768,0.004669866462548574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,512,0.0045162667830785114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,256,0.003995733211437861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,128,0.003738666574160258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,32,0.003970133264859518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,8192,64,0.0036256000399589538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,16384,0.04512319962183635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,12288,0.03345066706339518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,65536,0.16226879755655926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,10240,0.029967999458312987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,7168,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,8192,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,6144,0.019640533129374187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,5120,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,4096,0.014221866925557455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,3584,0.01318933367729187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,3072,0.011969066659609477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,2048,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,2560,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,1536,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,1024,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,512,0.004856533308823904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,768,0.00565119981765747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,256,0.004515199859937032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,128,0.004068266600370407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,64,0.0034485332667827605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,7168,32,0.004010666658480962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,12288,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,16384,0.04239146709442139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,65536,0.1305941343307495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,10240,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,8192,0.022923733790715536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,7168,0.019368533293406168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,6144,0.01731733282407125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,4096,0.012813867131868998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,5120,0.015413332978884378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,3584,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,3072,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,2048,0.00858133335908254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,2560,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,1536,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,1024,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,768,0.0052373334765434265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,512,0.004509866734345754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,256,0.003988266736268997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,128,0.003734400123357773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,64,0.0035616000493367515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,6144,32,0.0034986667335033415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,12288,0.030037333567937214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,16384,0.03704426685969035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,65536,0.11475626627604167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,8192,0.01863893270492554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,7168,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,5120,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,6144,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,4096,0.012060800194740295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,3584,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,3072,0.010434133807818095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,2560,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,2048,0.00796693315108617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,1536,0.006712533533573151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,1024,0.005430399874846141
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,768,0.00525439977645874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,256,0.004014933357636133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,128,0.00367253323396047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,512,0.004823466638724009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,64,0.0035904000202814737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,5120,32,0.0036650667587916053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,16384,0.030446932713190718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,12288,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,65536,0.09700693289438883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,10240,0.020936532815297445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,8192,0.016156799594561257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,7168,0.014252799749374389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,6144,0.013155200084050498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,5120,0.011868799726168316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,3584,0.009399466713269551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,4096,0.009955199559529622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,3072,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,2560,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,1536,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,2048,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,1024,0.00486826648314794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,768,0.004498133560021719
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,512,0.0040618665516376495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,256,0.004004266609748204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,128,0.0036778666079044344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,32,0.003656533360481262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,4096,64,0.0035946667194366455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,16384,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,12288,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,10240,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,8192,0.01691733400026957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,7168,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,6144,0.012549333771069846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,5120,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,3584,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,4096,0.00963200032711029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,3072,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,2560,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,2048,0.006258133550484974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,1536,0.005073066552480062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,1024,0.0045525332291920986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,512,0.0042026668787002565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,768,0.0043818667531013485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,256,0.003980800012747447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,128,0.003443199892838796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,64,0.0035968000690142312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,32,0.00365226666132609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,65536,0.0722261349360148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,16384,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,12288,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,10240,0.01657600005467733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,8192,0.014792533715566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,7168,0.013160533706347146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,6144,0.012133333086967468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,4096,0.00953493316968282
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,5120,0.010731732845306397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,3584,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,3072,0.007874133189519246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,2560,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,1536,0.005407999952634176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,2048,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,1024,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,768,0.004399999976158142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,512,0.003980800012747447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,256,0.003656533360481262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,128,0.003509333233038584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,32,0.003509333233038584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3072,64,0.0031968000034491217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,16384,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,65536,0.0612010677655538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,10240,0.016637866695721946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,12288,0.01800959904988607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,8192,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,7168,0.01285546620686849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,6144,0.011787733435630799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,5120,0.010397866368293762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,4096,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,3072,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,3584,0.00817920019229253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,2560,0.006972800195217133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,2048,0.005860266586144766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,1536,0.00505920002857844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,1024,0.004497066636880239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,768,0.004403199752171834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,256,0.003643733263015747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,512,0.004016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,128,0.0035445332527160645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,64,0.003222399950027466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2560,32,0.003519999980926514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,16384,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,65536,0.05007253487904867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,12288,0.016639999548594155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,10240,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,8192,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,6144,0.011617066462834676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,7168,0.012034133076667786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,5120,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,4096,0.010433066884676616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,3584,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,3072,0.008661333719889324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,2560,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,1536,0.005032533407211303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,2048,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,1024,0.00476800004641215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,768,0.004340266684691111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,512,0.004026666780312856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,256,0.0037717332442601522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,128,0.0035829332967599234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,32,0.0035914666950702667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,2048,64,0.0034272000193595886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,65536,0.0418442686398824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,16384,0.015756799777348836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,12288,0.01341759959856669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,10240,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,8192,0.012370133399963379
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,7168,0.011523200074831645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,6144,0.010900266965230306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,5120,0.009546666344006857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,4096,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,3072,0.006977066894372304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,3584,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,2048,0.00544213354587555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,1536,0.005030400057633718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,768,0.004331733286380768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,1024,0.004369066655635833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,512,0.003999999910593033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,256,0.003655466685692469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,128,0.0035786665976047516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,64,0.003219199925661087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1536,32,0.003186133255561193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,16384,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,65536,0.02990079919497172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,12288,0.012333866953849793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,10240,0.011556266744931539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,8192,0.010453333457310993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,6144,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,7168,0.012152533729871113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,5120,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,4096,0.009102933605511983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,3584,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,3072,0.00664213349421819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,1536,0.005883733431498209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,2048,0.006607999900976817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,1024,0.00492799977461497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,768,0.004743466774622599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,512,0.004422399898370107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,128,0.0036117332677046456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,256,0.003621333340803782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,64,0.00359253336985906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,1024,32,0.0035797332723935447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,65536,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,16384,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,12288,0.014146133263905843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,10240,0.012780800461769104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,8192,0.011585066715876263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,7168,0.010398933291435241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,6144,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,4096,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,5120,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,3584,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,3072,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,2560,0.005849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,2048,0.005425066749254862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,1536,0.004861866434415182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,768,0.004040533304214477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,1024,0.004448000093301137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,512,0.003947733342647553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,256,0.0035989334185918174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,128,0.0032405334214369455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,64,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,768,32,0.003236266722281774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,16384,0.012845866878827415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,65536,0.02211839954058329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,12288,0.010424533486366272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,12288,64,0.003973333289225897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,8192,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,10240,0.010914132992426554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,6144,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,5120,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,7168,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,4096,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,3584,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,2560,0.006479999919732411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,3072,0.007289599875609081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,1536,0.005492266515890757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,2048,0.005895466605822245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,1024,0.005038933455944061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,768,0.004386133452256521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,512,0.0041909332076708475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,256,0.004238933324813843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,128,0.004553600152333578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,64,0.003455999990304311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,512,32,0.0039818666875362395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,65536,0.02056000034014384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,16384,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,12288,0.009147733449935913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,10240,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,8192,0.009113599856694538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,6144,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,7168,0.008226133386294047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,4096,0.007748266557852428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,3584,0.008090666433175405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,5120,0.008328533172607422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,3072,0.007201066613197327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,2560,0.007303466896216075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,2048,0.006945066650708516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,1536,0.005243733525276184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,1024,0.004744533201058706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,768,0.004423466821511587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,512,0.003774933268626531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,256,0.003521066655715307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,64,0.003565866748491923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,128,0.004121600091457367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,256,32,0.0036799999574820197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,65536,0.01486186683177948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,16384,0.009546666344006857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,12288,0.008602666854858398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,10240,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,8192,0.0076799998680750535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,6144,0.006701866785685222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,7168,0.008082133531570435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,5120,0.006875733534495036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,4096,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,3584,0.00717439999183019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,2560,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,3072,0.006836266815662384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,2048,0.007705600063006084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,1536,0.005137066543102265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,1024,0.004599466423193614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,768,0.004342400034268697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,512,0.003933866570393244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,64,0.0038111999630928038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,256,0.0037461332976818085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,128,0.0036586667100588477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,128,32,0.003714133302370707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,16384,0.00897706647713979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,65536,0.01316480040550232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,12288,0.007857066889603932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,10240,0.008055466910203297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,7168,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,8192,0.007528533538182576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,6144,0.007231999933719635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,5120,0.006554666658242543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,4096,0.006520533561706543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,3072,0.006658133367697399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,3584,0.006819200019041698
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,2560,0.006906666855017345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,2048,0.006337066491444905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,1536,0.005226666728655497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,768,0.004312533140182495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,1024,0.00486826648314794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,512,0.004242133100827535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,256,0.003668266783157984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,128,0.0035189333061377203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,64,0.003551999976237615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,64,32,0.003286399940649668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,12288,0.00782719999551773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,16384,0.008087466657161712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,65536,0.011970133582750956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,10240,0.007414400080839793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,8192,0.007796266674995422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,7168,0.007627733548482259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,6144,0.007337599992752075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,5120,0.006852266689141591
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,4096,0.006433066725730896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,3584,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,3072,0.006552533308664958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,2048,0.006692266464233399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,2560,0.006906666855017345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,1024,0.0044159998496373495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,1536,0.005008000135421753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,768,0.004329599936803182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,512,0.0038880000511805216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,256,0.003673599908749262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,64,0.0033952000240484873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,128,0.0032874666154384612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,32,32,0.004081066697835922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,12288,0.26753921508789064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,10240,0.21486934026082358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,16384,0.3757472038269043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,7168,0.1505280017852783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,6144,0.1301162640253703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,8192,0.17510186831156413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,4096,0.08949759801228842
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,5120,0.10990933577219646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,3584,0.07799039681752523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,3072,0.06809600194295248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,2560,0.05775359869003296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,2048,0.04754879872004191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,1536,0.03665813207626343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,1024,0.02640639940897624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,768,0.02097813288370768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,512,0.014518400033315023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,256,0.009921066959698995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,128,0.007507200042406718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,64,0.006894933183987935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,65536,32,0.007649066547552745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,96,3584,65536,0.07990612983703613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,16384,0.08755306402842203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,12288,0.0626688003540039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,10240,0.053725866476694736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,8192,0.04475520054499309
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,7168,0.03843413194020589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,65536,0.31293439865112305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,5120,0.029743999242782593
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,6144,0.03426986535390218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,4096,0.023847466707229613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,3072,0.019232000907262167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,2560,0.016569599509239197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,1024,0.008854400118192036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,1536,0.01136959989865621
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,2048,0.013518933455149332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,512,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,256,0.004588800172011057
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,128,0.0042133331298828125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,64,0.0040501333773136135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,32,0.004289066791534424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,16384,0.07389547030131022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,12288,0.054647465546925865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,65536,0.2508117357889811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,10240,0.047172268231709794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,8192,0.03945813179016113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,7168,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,6144,0.030364799499511718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,5120,0.025649066766103106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,4096,0.0217631995677948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,3584,0.01895573337872823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,3072,0.01637226641178131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,2560,0.014485333363215128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,1536,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,2048,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,1024,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,768,0.006894933183987935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,512,0.006007466713587443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,256,0.004920533299446106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,128,0.004249600072701773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,32,0.004264533519744873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,12288,64,0.004277333120505015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,16384,0.06109973192214966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,65536,0.20695039431254067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,12288,0.046217600504557296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,10240,0.036999468008677164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,8192,0.03289600014686585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,7168,0.02735466758410136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,6144,0.02387946645418803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,5120,0.021002666155497233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,4096,0.01842026710510254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,3584,0.015475199619928996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,3072,0.014051199952761332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,2560,0.012745599945386252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,2048,0.0107424000898997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,1536,0.009057066837946574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,768,0.005919999877611796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,1024,0.00877333382765452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,512,0.005751466751098633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,256,0.005166933437188466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,128,0.0042805333932240805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,64,0.004289066791534424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,10240,32,0.004125866790612539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,16384,0.0500053326288859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,65536,0.1712821324666341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,12288,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,8192,0.02639893293380737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,10240,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,7168,0.023052799701690673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,6144,0.020568533738454183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,5120,0.017762132485707603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,4096,0.014667733510335287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,3584,0.013293866316477457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,2560,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,1536,0.007865599791208903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,2048,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,1024,0.006968533496061961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,768,0.005510400235652924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,512,0.005075199902057648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,256,0.004333866635958353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,128,0.004785066843032837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,32,0.00405973345041275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,8192,64,0.003952000041802724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,16384,0.04719680150349935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,65536,0.158788267771403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,12288,0.037614933649698895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,10240,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,8192,0.02626986702283223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,7168,0.02523840069770813
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,6144,0.022721066077550253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,5120,0.01946773330370585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,3584,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,4096,0.016302933295567833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,3072,0.011517866452534994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,2560,0.010363733768463135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,2048,0.00929813285668691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,1536,0.008055466910203297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,1024,0.005835733314355215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,768,0.005246933301289876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,512,0.004642133414745331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,256,0.004323199888070424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,128,0.0034282666941483817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,32,0.0042453333735466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,7168,64,0.003993600110212962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,16384,0.04007360140482585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,65536,0.12622506618499757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,12288,0.03159466584523519
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,10240,0.028534400463104247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,8192,0.022446932395299275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,7168,0.019232000907262167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,6144,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,5120,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,3584,0.011994666854540507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,4096,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,3072,0.01107413371404012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,2560,0.010102400183677673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,2048,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,1536,0.0075434664885203045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,1024,0.006381866832574208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,768,0.0056757330894470215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,512,0.005074133475621542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,256,0.004351999859015147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,128,0.0046293333172798155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,32,0.003806933263937632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,6144,64,0.003824000060558319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,16384,0.035224533081054686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,65536,0.10833919843037923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,10240,0.02518933415412903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,8192,0.02190293272336324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,7168,0.019233065843582153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,6144,0.01456106702486674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,5120,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,4096,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,3584,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,3072,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,2560,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,2048,0.007841066519419352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,1536,0.00701333334048589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,1024,0.005449600021044413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,768,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,256,0.0041696002086003625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,512,0.00462719996770223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,128,0.0036874666810035707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,64,0.003705599904060364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,5120,32,0.0036661334335803984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,65536,0.09175146420796712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,10240,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,8192,0.016362667083740234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,7168,0.014325333635012307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,6144,0.013220266501108805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,5120,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,4096,0.010216533144315084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,3584,0.009409067034721375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,3072,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,2560,0.007461333274841308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,2048,0.006568533182144165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,1536,0.00561599979797999
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,1024,0.004839466512203216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,768,0.004558933277924856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,512,0.004092800120512644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,256,0.003701333453257879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,128,0.0037151999771595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,64,0.003667200108369192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,4096,32,0.003689600030581156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,16384,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,65536,0.07669760386149088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,12288,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,10240,0.01964906652768453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,8192,0.017321600516637167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,7168,0.017189333836237587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,6144,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,4096,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,5120,0.011410133043924967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,3584,0.008719999591509502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,3072,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,2560,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,2048,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,1536,0.005133866767088572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,1024,0.004923733572165171
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,768,0.004390400151411692
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,512,0.004042666653792063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,256,0.0036661334335803984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,128,0.0035936000446478524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,64,0.003323733309904734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3584,32,0.003602133442958196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,16384,0.023895466327667238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,65536,0.0688149372736613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,10240,0.017386666933695474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,12288,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,8192,0.015202132860819497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,7168,0.013299199938774108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,6144,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,5120,0.010739200313886007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,4096,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,3584,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,3072,0.007929599781831106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,2560,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,2048,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,1536,0.005342933535575867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,1024,0.004862933357556661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,768,0.004548266530036926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,512,0.004188799858093261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,256,0.003717333326737086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,128,0.0036906667053699495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,64,0.003323733309904734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,3072,32,0.0035989334185918174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,16384,0.021552000443140665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,65536,0.058606934547424314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,12288,0.017729065815607705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,10240,0.015825066963831583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,8192,0.014380799730618796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,7168,0.01340053379535675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,6144,0.011673600474993388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,5120,0.010294399658838908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,4096,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,3584,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,3072,0.007441066702206929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,2560,0.006677333513895671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,2048,0.005851733187834421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,1024,0.004846933484077454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,1536,0.005039999882380167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,768,0.004178133110205332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,512,0.004167466859022776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,256,0.0036469332873821257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,128,0.0036544000109036768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,64,0.0032426667710145317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2560,32,0.0032245332996050516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,16384,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,65536,0.048401065667470294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,12288,0.01569066643714905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,10240,0.0144405335187912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,7168,0.012131200234095255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,8192,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,6144,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,5120,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,4096,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,3584,0.009542399644851684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,3072,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,2560,0.007463466624418895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,2048,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,1536,0.005221333106358846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,1024,0.0045952002207438145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,768,0.004394666850566864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,512,0.004112000018358231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,256,0.0036906667053699495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,128,0.003638399889071783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,64,0.0033002667129039764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,2048,32,0.00359253336985906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,16384,0.015612799922625223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,65536,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,12288,0.013596799969673157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,3584,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,10240,0.013707733154296875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,8192,0.012349866827329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,6144,0.01111466685930888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,7168,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,5120,0.00981119970480601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,16384,768,0.007145600020885467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,4096,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,3584,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,3072,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,2560,0.006190933287143707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,2048,0.005494399865468343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,1024,0.004556799928347269
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,1536,0.005331199864546458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,768,0.004421333471934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,512,0.003964799890915553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,256,0.003701333453257879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,128,0.003311999887228012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,64,0.003257599969704946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1536,32,0.0032426667710145317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,65536,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,12288,0.01242453356583913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,10240,0.011468799908955891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,16384,0.012344533205032348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,8192,0.009947733084360758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,7168,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,6144,0.010705066720644633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,5120,0.010364799698193868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,4096,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,3584,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,3072,0.006860800087451935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,2048,0.006381866832574208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,2560,0.00589333325624466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,1536,0.005667200187842051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,1024,0.005245866874853769
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,768,0.0048096001148223875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,256,0.003671466559171677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,512,0.004095999896526337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,128,0.003655466685692469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,64,0.0033781332274278007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,1024,32,0.003656533360481262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,16384,0.01688213348388672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,12288,0.01399679978688558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,65536,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,10240,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,8192,0.01138879954814911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,7168,0.010289067029953003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,5120,0.008683733145395915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,6144,0.009100799759229023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,3584,0.007114666700363159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,4096,0.007701333363850911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,3072,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,2048,0.00544213354587555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,1536,0.005145599941412607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,1024,0.004500266909599304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,768,0.00410453329483668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,512,0.004081066697835922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,128,0.0036618667344252265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,256,0.0036256000399589538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,32,0.0032618666688601174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,768,64,0.0033514666060606635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,16384,0.013040000200271606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,65536,0.01834239959716797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,12288,0.011381333072980244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,8192,0.008725333213806152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,10240,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,7168,0.008342400193214417
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,6144,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,5120,0.008316799998283386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,3584,0.007111466427644093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,4096,0.007464533547560374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,3072,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,2560,0.005857066810131073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,2048,0.005746133128801982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,1024,0.004499199986457825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,1536,0.004924799998601278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,512,0.00402453343073527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,768,0.004046933352947235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,256,0.0036608000596364343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,128,0.0032853332658608755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,64,0.003401600072781245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,512,32,0.0034901333351929987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,65536,0.018478933970133463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,12288,0.010286933183670044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,16384,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,10240,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,8192,0.008616532882054646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,7168,0.008274133503437042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,5120,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,6144,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,4096,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,3584,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,3072,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,2048,0.005407999952634176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,2560,0.006612266600131989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,1536,0.004984533290068308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,1024,0.0045045331120491024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,768,0.004020266731580098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,512,0.004259199897448222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,256,0.003667200108369192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,64,0.0031189332405726117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,32,0.0033258666594823206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,65536,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,16384,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,10240,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,8192,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,12288,0.008283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,7168,0.008236800134181977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,6144,0.0075914666056633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,5120,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,4096,0.007009066641330719
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,3584,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,3072,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,2048,0.006262399752934774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,2560,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,1024,0.004408533374468485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,1536,0.004783999919891357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,768,0.0040554667512575785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,512,0.0036330667634805044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,128,0.0033130665620168054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,256,0.003239466746648153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,64,0.0031839999059836066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,128,32,0.0031839999059836066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,65536,0.014013866583506266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,16384,0.008260266482830047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,12288,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,8192,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,7168,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,10240,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,6144,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,5120,0.006292266647020976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,4096,0.006211199859778086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,3584,0.00643093337615331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,3072,0.0063274666666984555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,2560,0.0061951999862988796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,2048,0.005847466488679251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,1536,0.004922666649023692
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,768,0.003956266740957896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,512,0.0039488000174363455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,1024,0.00408746674656868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,256,0.0035690667728583017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,128,0.003260799994071325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,64,0.0031360000371932983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,64,32,0.0032127998769283296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,65536,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,12288,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,16384,0.008280533552169799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,10240,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,8192,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,7168,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,6144,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,5120,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,3584,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,4096,0.0061589335401852924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,3072,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,2560,0.0066997334361076355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,2048,0.005906133353710175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,1536,0.00481279989083608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,1024,0.004469333092371622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,512,0.0036458666125933326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,768,0.004025600105524063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,256,0.0033088001112143196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,128,0.0032074667513370516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,64,0.003206400076548258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,32,32,0.003223466624816259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,10240,0.22743040720621743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,12288,0.26815147399902345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,16384,0.37092692057291665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,6144,0.14267733891805012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,8192,0.18418347040812175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,7168,0.15811413129170734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,4096,0.09707520008087159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,5120,0.11560959815979004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,3584,0.08406506379445394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,2560,0.059903999169667564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,3072,0.07174932956695557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,2048,0.05156373182932535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,1536,0.039662933349609374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,1024,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,768,0.02251946727434794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,256,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,512,0.015783466895421348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,128,0.0058559998869895935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,32,0.005032533407211303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,65536,64,0.005266133447488149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,12288,0.062087468306223546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,16384,0.0867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,8192,0.04403306643168132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,10240,0.05461546579996744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,65536,0.34778451919555664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,7168,0.03843413194020589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,6144,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,5120,0.028943999608357744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,4096,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,3584,0.0216213325659434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,2560,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,2048,0.01362986663977305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,3072,0.01882879932721456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,1536,0.01120746632417043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,768,0.0074325333038965866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,512,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,256,0.004564266900221507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,128,0.00407679999868075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,64,0.004030933231115341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,16384,32,0.00413973331451416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,12288,0.051438931624094644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,16384,0.0687445322672526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,8192,0.037206399440765384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,10240,0.04464426835378011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,65536,0.24950826962788902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,7168,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,6144,0.028497066100438433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,5120,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,4096,0.02012053330739339
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,3584,0.0181386669476827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,3072,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,2560,0.013901866475741067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,2048,0.011925333738327026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,1024,0.007968000074227651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,768,0.0063285330931345625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,512,0.004790399968624115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,128,0.004068266600370407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,256,0.004347733159859975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,64,0.004066133250792822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,12288,32,0.004040533304214477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,12288,0.040482131640116374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,16384,0.05437440077463786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,65536,0.21575679779052734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,8192,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,10240,0.035420799255371095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,6144,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,5120,0.020218666394551596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,7168,0.025601067145665485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,4096,0.016226133704185484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,3584,0.014586666226387024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,3072,0.012755200266838074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,2048,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,1536,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,1024,0.00598826656738917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,768,0.004994133114814758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,512,0.004523733258247375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,256,0.004218666752179464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,128,0.0035968000690142312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,32,0.003798400113979975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,10240,64,0.003730133424202601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,16384,0.04911786715189616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,65536,0.18384213447570802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,12288,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,10240,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,7168,0.020875734090805054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,6144,0.018681599696477254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,5120,0.016362667083740234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,4096,0.013438933094342551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,3072,0.01192639966805776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,2048,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,2560,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,1536,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,1024,0.00547626664241155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,512,0.004423466821511587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,768,0.0048991998036702475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,256,0.0039818666875362395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,128,0.003986133386691412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,64,0.0036757332583268487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,8192,32,0.0041002665956815084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,12288,0.037887998421986896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,16384,0.04669440189997355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,65536,0.16493226687113444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,10240,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,8192,0.022516266504923502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,7168,0.01993280053138733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,6144,0.017730132738749186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,4096,0.012813867131868998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,5120,0.015348266561826071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,3584,0.011718400319417318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,3072,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,2048,0.00858133335908254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,2560,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,1536,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,1024,0.005031466484069824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,768,0.004964266717433929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,512,0.004452266792456309
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,256,0.003977599988381068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,64,0.0036874666810035707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,128,0.0036373332142829893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,7168,32,0.004016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,12288,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,16384,0.04061866601308187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,65536,0.12458666960398357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,10240,0.028193066517512005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,8192,0.019577600558598838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,7168,0.019777067502339683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,6144,0.017866667111714682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,5120,0.015241600076357522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,4096,0.012812800208727517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,3584,0.011925333738327026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,2560,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,2048,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,3072,0.009750399986902874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,1024,0.004990933338801066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,1536,0.00584853341182073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,768,0.0045056000351905824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,512,0.004163199911514918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,256,0.003957333415746689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,128,0.003573333223660787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,64,0.0035616000493367515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,6144,32,0.0036650667587916053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,12288,0.027100799481074016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,16384,0.03420159816741943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,65536,0.10649600028991699
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,8192,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,10240,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,6144,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,5120,0.013356799880663553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,7168,0.0186901330947876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,4096,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,3584,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,3072,0.009511466821034749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,2560,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,2048,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,1536,0.005529599885145823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,1024,0.004675200084845225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,768,0.004434133569399515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,256,0.003980800012747447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,128,0.003664000084002813
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,512,0.0041002665956815084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,64,0.0036202666660149893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,5120,32,0.003697066754102707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,16384,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,12288,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,65536,0.09280853271484375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,8192,0.01601599951585134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,10240,0.019730132818222047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,7168,0.014082133769989014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,5120,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,6144,0.012984533111254373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,4096,0.009819733103116353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,3584,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,3072,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,2048,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,1536,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,2560,0.007423999905586243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,1024,0.004710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,768,0.004281599819660187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,512,0.004009599983692169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,256,0.0036415999134381616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,128,0.0035797332723935447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,64,0.003272533416748047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,4096,32,0.0036831999818483984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,65536,0.0759114662806193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,12288,0.02046826680501302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,16384,0.026283733050028485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,10240,0.017796266078948974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,8192,0.015542399883270264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,7168,0.013605333367983499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,6144,0.012572800119717916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,5120,0.011139200131098429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,4096,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,3584,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,3072,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,2048,0.006192000210285186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,1536,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,2560,0.006779733300209046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,768,0.004796800017356872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,1024,0.004529066880544027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,512,0.00402453343073527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,256,0.003605333218971888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,128,0.003659733384847641
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,64,0.0036490666369597114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3584,32,0.0039018665750821433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,65536,0.06813013553619385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,12288,0.02007253368695577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,16384,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,8192,0.015610667069753012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,10240,0.01807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,7168,0.014457600315411887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,5120,0.01076586643854777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,6144,0.01209493378798167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,4096,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,3584,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,3072,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,1536,0.005323733389377594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,2048,0.005814399818579356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,2560,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,1024,0.00480320006608963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,768,0.0044159998496373495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,512,0.00408746674656868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,256,0.003868799904982249
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,128,0.0036117332677046456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,64,0.003253333270549774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,3072,32,0.0035061334570248926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,65536,0.05789013306299845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,12288,0.01889066696166992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,16384,0.02258239984512329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,10240,0.016908800601959227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,8192,0.014825600385665893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,7168,0.013653332988421122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,6144,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,5120,0.009922132889429728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,3584,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,3072,0.007110400001207988
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,4096,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,2560,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,2048,0.0054058666030565895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,1536,0.00521066685517629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,1024,0.004827733337879181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,768,0.004328533510367076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,512,0.003933866570393244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,256,0.0036298667391141256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,128,0.0035573333501815797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,32,0.003572266548871994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2560,64,0.003293866664171219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,65536,0.048504531383514404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,16384,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,12288,0.015414399902025857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,10240,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,8192,0.01262933313846588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,6144,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,7168,0.011867733796437581
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,5120,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,4096,0.008374399940172831
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,80,256,128,0.0034154665966828666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,3584,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,3072,0.007106133302052816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,2560,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,1024,0.004534400006135305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,2048,0.0054613331953684485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,1536,0.005277866621812185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,768,0.004377600053946177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,512,0.00409706657131513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,256,0.00367253323396047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,64,0.003310933212439219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,128,0.003435733417669932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,2048,32,0.0033418667813142145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,16384,0.01530346671740214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,65536,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,12288,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,10240,0.012267733613650005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,8192,0.011107200384140014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,7168,0.010103467106819152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,5120,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,6144,0.009064533313115438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,4096,0.008412800232569377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,3584,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,3072,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,2560,0.00589333325624466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,2048,0.00544213354587555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,1536,0.005194666484991709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,1024,0.0044714664419492085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,512,0.003994666785001755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,768,0.00448639988899231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,256,0.003576533248027166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,128,0.003293866664171219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,64,0.0032768001159032187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,16384,0.012267733613650005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1536,32,0.0032640000184377036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,65536,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,12288,0.01076693336168925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,10240,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,8192,0.009101866682370504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,6144,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,7168,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,5120,0.008274133503437042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,3584,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,4096,0.007701333363850911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,2560,0.006075733403364817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,2048,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,1536,0.004849066833655039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,1024,0.004463999966780345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,768,0.004171733558177948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,512,0.004004266609748204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,256,0.003605333218971888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,64,0.0032842665910720824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,128,0.0033386667569478357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,1024,32,0.003790933390458425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,65536,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,16384,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,10240,0.010289067029953003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,12288,0.009543466567993163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,7168,0.008646399776140849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,8192,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,6144,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,5120,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,4096,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,3584,0.007463466624418895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,3072,0.007111466427644093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,2048,0.005649066468079885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,2560,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,1536,0.004814933240413666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,1024,0.004389333228270212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,768,0.004080000023047129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,128,0.0033258666594823206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,256,0.003553066651026408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,512,0.003651199986537298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,64,0.003304533412059148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,768,32,0.0032874666154384612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,65536,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,16384,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,12288,0.00925973355770111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,10240,0.009539199868837993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,8192,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,7168,0.00790826678276062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,5120,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,6144,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,4096,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,3072,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,2560,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,3584,0.007463466624418895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,2048,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,1536,0.00477866679430008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,1024,0.0043488000830014546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,768,0.004051200052102407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,512,0.0036778666079044344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,256,0.0036256000399589538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,128,0.003601066768169403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,64,0.003180799881617228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,512,32,0.0032266666491826378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,16384,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,65536,0.015474133690198264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,10240,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,8192,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,12288,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,7168,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,6144,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,5120,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,3584,0.006806399921576183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,4096,0.006983466446399689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,2560,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,2048,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,1536,0.004790399968624115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,1024,0.00436160018046697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,512,0.0037087999284267426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,768,0.003909333298603693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,128,0.0032650666932264962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,64,0.0031776001056035364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,256,0.0033770665526390077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,256,32,0.0031968000034491217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,16384,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,10240,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,65536,0.014484266440073649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,12288,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,8192,0.007114666700363159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,6144,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,7168,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,5120,0.006313600142796834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,4096,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,3584,0.006632533172766368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,3072,0.006270933151245117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,2560,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,2048,0.0062613333264986675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,1536,0.004941866795221964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,1024,0.0043605332573254905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,512,0.0036127999424934386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,256,0.0035989334185918174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,768,0.004008533308903376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,128,0.003172266731659571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,64,0.0031626666585604347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,128,32,0.0030986666679382324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,16384,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,65536,0.011526399850845337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,12288,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,10240,0.006701866785685222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,8192,0.006676266590754191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,6144,0.006502399841944377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,7168,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,5120,0.006737066805362702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,4096,0.005973333120346069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,3584,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,2560,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,3072,0.005938133100668589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,2048,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,1536,0.004844800134499868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,1024,0.004377600053946177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,768,0.003956266740957896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,512,0.003638399889071783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,256,0.0033887999753157297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,128,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,32,0.0032138665517171226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,64,64,0.003176533430814743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,65536,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,16384,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,12288,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,8192,0.006705066561698914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,7168,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,10240,0.0064746667941411335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,6144,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,5120,0.006259199976921081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,4096,0.006292266647020976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,3584,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,2560,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,3072,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,2048,0.0063285330931345625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,1536,0.00483840008576711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,1024,0.0040501333773136135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,768,0.0038005332152048744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,512,0.0036618667344252265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,128,0.0032543999453385672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,64,0.0028437333802382152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,32,0.0032426667710145317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,64,32,256,0.003370666752258936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,8192,0.186845858891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,10240,0.2240821361541748
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,12288,0.2684927940368652
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,16384,0.37710507710774743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,5120,0.11492693424224854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,6144,0.1401866594950358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,7168,0.15843839645385743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,4096,0.09714346726735433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,3072,0.07154346307118734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,3584,0.08383039633433023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,2560,0.0609279990196228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,2048,0.05198506514231364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,1024,0.028195200363794963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,1536,0.03829546769460042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,512,0.015197867155075073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,768,0.02176533341407776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,128,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,256,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,64,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,65536,32,0.006980266670385997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,12288,0.06203413407007853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,16384,0.08721066315968831
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,10240,0.053179732958475744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,8192,0.04396373430887858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,7168,0.037752532958984376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,65536,0.3483978589375814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,6144,0.03345066706339518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,4096,0.023756800095240276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,3584,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,2560,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,3072,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,2048,0.013434666395187377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,1536,0.011107200384140014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,1024,0.008603733777999879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,512,0.005257600049177805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,768,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,256,0.004519466559092204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,128,0.003986133386691412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,64,0.003700266778469086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,16384,32,0.0036629334092140196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,16384,0.07492160002390544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,12288,0.050996267795562746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,10240,0.04437226851781209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,8192,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,65536,0.2554357369740804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,7168,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,6144,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,5120,0.02427306572596232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,4096,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,3584,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,2560,0.014381866653760275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,3072,0.01644266645113627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,2048,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,1536,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,1024,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,512,0.005241600175698599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,256,0.004561066627502441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,768,0.006266666452089946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,128,0.004130133241415024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,64,0.0036917333801587426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,12288,32,0.004078933348258337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,16384,0.05696959892908732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,12288,0.040701866149902344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,10240,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,65536,0.21323092778523764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,8192,0.029151999950408937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,7168,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,6144,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,4096,0.01684053341547648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,5120,0.019922133286794028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,3584,0.014587733149528503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,3072,0.013160533706347146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,2560,0.011754666765530903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,1536,0.00858026643594106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,1024,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,2048,0.010294399658838908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,768,0.004995200037956238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,512,0.004507733384768168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,256,0.004092800120512644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,128,0.004025600105524063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,64,0.0036127999424934386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,10240,32,0.003833599885304769
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,12288,0.03857066631317139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,10240,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,16384,0.04843306541442871
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,65536,0.1810431957244873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,8192,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,7168,0.02086826761563619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,6144,0.018554667631785073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,5120,0.016235733032226564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,4096,0.013428266843159994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,3584,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,2560,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,3072,0.011935999989509583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,1536,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,1024,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,768,0.00517439991235733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,512,0.004463999966780345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,256,0.003986133386691412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,64,0.003704533229271571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,128,0.0036949334045251214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,32,0.0036864000062147772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,16384,0.04491946697235107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,12288,0.03604480028152466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,65536,0.15592106183369953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,10240,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,7168,0.01936533252398173
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,6144,0.017191465695699057
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,4096,0.012436266740163167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,5120,0.015076266725858054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,3584,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,3072,0.010357333223025005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,2560,0.01009386678536733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,2048,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,1536,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,1024,0.005585066477457682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,768,0.004561066627502441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,512,0.004355200131734212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,256,0.0039893334110577905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,64,0.0035402665535608927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,128,0.0036373332142829893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,7168,32,0.0036042665441830954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,16384,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,65536,0.12287893295288085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,10240,0.027100799481074016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,8192,0.0231221338113149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,7168,0.020205867290496827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,5120,0.01581653356552124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,4096,0.01264639993508657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,3584,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,3072,0.010834133625030518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,2560,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,1536,0.00584853341182073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,2048,0.0077002664407094315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,1024,0.0046623999873797095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,768,0.004824533561865489
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,256,0.004005333284536997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,512,0.004366933306058248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,128,0.0036586667100588477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,64,0.0035605333745479585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,6144,32,0.003659733384847641
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,16384,0.03583999872207642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,65536,0.10714453061421711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,12288,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,10240,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,8192,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,7168,0.018076799313227334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,6144,0.016578132907549538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,5120,0.014254933595657349
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,4096,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,3584,0.010738133390744527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,3072,0.010150399804115296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,2560,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,1536,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,2048,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,768,0.004542933404445648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,512,0.0040501333773136135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,1024,0.005019733309745788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,256,0.004009599983692169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,128,0.003605333218971888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,64,0.0035573333501815797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,5120,32,0.0035402665535608927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,65536,0.08816640377044678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,16384,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,12288,0.022052266200383506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,7168,0.015337600310643514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,10240,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,8192,0.0160970667997996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,6144,0.014042666554450989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,5120,0.011285332838694255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,4096,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,3584,0.009331199526786804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,3072,0.008386133114496867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,2560,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,2048,0.005952000121275584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,1536,0.005037866532802582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,768,0.004391466577847799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,1024,0.00451093316078186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,512,0.003952000041802724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,256,0.003914666672547659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,64,0.0032117334504922234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,128,0.003619199991226196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,4096,32,0.003562666724125544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,16384,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,12288,0.0197760005791982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,65536,0.07574186325073243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,8192,0.015611732999483744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,7168,0.014255999525388082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,10240,0.017619200547536216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,6144,0.013597866892814637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,5120,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,4096,0.009544533491134644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,3584,0.008785067001978557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,3072,0.007702399790287018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,2560,0.006714666883150737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,2048,0.005983999868233999
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,1536,0.004937600096066793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,768,0.004422399898370107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,1024,0.004588800172011057
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,512,0.0039594667653242745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,256,0.0036821333070596062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,64,0.0034442665676275887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,128,0.003517866631348928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3584,32,0.0035306667288144433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,16384,0.022257065773010253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,65536,0.06802879969278972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,12288,0.017388800779978432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,7168,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,8192,0.013914666573206582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,10240,0.015689599514007568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,6144,0.011994666854540507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,5120,0.010533333818117777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,4096,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,3584,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,3072,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,2560,0.0066442668437957765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,2048,0.006190933287143707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,1536,0.005038933455944061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,1024,0.004537599782148996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,768,0.004424533247947693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,512,0.004054400076468786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,128,0.003619199991226196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,64,0.0032490665713946023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,256,0.0036821333070596062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,3072,32,0.0032992000381151833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,16384,0.02026559909184774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,65536,0.06099626620610556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,12288,0.015610667069753012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,8192,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,10240,0.014459733168284097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,7168,0.012219732999801636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,6144,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,5120,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,3584,0.008111999928951263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,3072,0.007293866574764251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,2560,0.006405333181222279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,2048,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,1536,0.0050335998336474095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,1024,0.004473599791526795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,768,0.004231466849644979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,256,0.003671466559171677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,512,0.0039061332742373147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,128,0.0035743998984495797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,64,0.003222399950027466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,32,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,16384,0.015894400080045064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,65536,0.04761600097020467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,12288,0.01541759967803955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,10240,0.014050133029619851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,8192,0.012411733468373615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,7168,0.011878400047620138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,6144,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,5120,0.009683199723561605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,4096,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,3584,0.007702399790287018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,3072,0.006604800124963124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,2048,0.005448533097902933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,2560,0.006198399762312571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,1536,0.005303466816743215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,1024,0.004533333579699198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,768,0.004344533383846283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,512,0.003964799890915553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,256,0.0035445332527160645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,128,0.0035135999321937563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,64,0.00322026660044988
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2048,32,0.0032927999893824257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,65536,0.036933334668477376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,12288,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,16384,0.015144532918930054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,10240,0.01193386713663737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,8192,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,7168,0.011512533823649088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,6144,0.01009173293908437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,5120,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,4096,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,3584,0.007050666709740956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,3072,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,2560,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,1536,0.004936533172925314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,2048,0.005379199981689453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,1024,0.004369066655635833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,768,0.004090666770935059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,512,0.0039594667653242745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,256,0.0036298667391141256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,128,0.0032511999209721885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,64,0.0032479998966058097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1536,32,0.00325546662012736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,16384,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,65536,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,12288,0.012035199999809265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,10240,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,8192,0.010035199920336406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,7168,0.009205333391825358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,6144,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,4096,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,5120,0.008516266942024231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,3584,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,2560,0.0058229332168896995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,2048,0.005564799904823304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,1536,0.005202133456865946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,1024,0.004453333218892416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,768,0.004095999896526337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,256,0.0035775999228159585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,512,0.00401706670721372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,128,0.003257599969704946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,64,0.003323733309904734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,1024,32,0.0033130665620168054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,65536,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,16384,0.011692800124486287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,10240,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,12288,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,8192,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,7168,0.008746666709582011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,6144,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,5120,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,4096,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,3584,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,3072,0.006234666705131531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,2048,0.005415466427803039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,2560,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,1536,0.004744533201058706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,1024,0.004404266675313314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,768,0.004016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,512,0.004001066585381826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,256,0.0035743998984495797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,128,0.0032320000231266023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,64,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,768,32,0.003218133250872294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,65536,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,12288,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,16384,0.010387200117111205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,10240,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,8192,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,7168,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,6144,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,5120,0.008181333541870117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,4096,0.0074986666440963745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,3584,0.007049599786599477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,2560,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,3072,0.006983466446399689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,2048,0.005312000215053558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,1536,0.00481279989083608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,1024,0.004370133578777313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,768,0.004071466624736786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,512,0.0036661334335803984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,256,0.003553066651026408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,128,0.0031850665807724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,32,0.0032287999987602235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,512,64,0.0032586666444937387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,65536,0.015963733196258545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,16384,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,12288,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,10240,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,8192,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,7168,0.00790826678276062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,6144,0.007461333274841308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,5120,0.007396266857783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,4096,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,3584,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,3072,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,2048,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,2560,0.006679466863473256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,1536,0.0045962666471799215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,1024,0.004428799947102865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,768,0.004068266600370407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,512,0.0036458666125933326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,256,0.003573333223660787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,128,0.0032960000137488045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,64,0.00314026673634847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,256,32,0.003197866678237915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,65536,0.014802133043607077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,8192,2048,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,12288,0.007803733150164287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,16384,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,10240,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,8192,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,7168,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,6144,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,5120,0.006131199995676676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,3584,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,4096,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,3072,0.005789866546789805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,2560,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,2048,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,1536,0.004642133414745331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,1024,0.0040224000811576845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,512,0.003638399889071783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,768,0.003908266623814901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,256,0.0032490665713946023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,128,0.003202133377393087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,32,0.003101866692304611
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,128,64,0.003205333401759466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,16384,0.007963733375072479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,65536,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,12288,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,10240,0.007456000149250031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,8192,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,7168,0.0066453332702318835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,6144,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,5120,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,3584,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,4096,0.005757866799831391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,3072,0.005857066810131073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,1536,0.00480320006608963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,2048,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,1024,0.0041354666153589886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,768,0.0039594667653242745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,512,0.0036821333070596062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,256,0.003550933301448822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,128,0.0032586666444937387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,32,0.0032511999209721885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,64,64,0.003193599979082743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,16384,0.007969066500663757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,65536,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,12288,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,10240,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,8192,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,7168,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,6144,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,5120,0.006232533355553945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,3584,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,4096,0.005791999896367391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,3072,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,2560,0.0061941335598627726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,1536,0.004779733220736186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,2048,0.0057888001203536986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,1024,0.0043488000830014546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,768,0.003999999910593033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,512,0.0036821333070596062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,256,0.003252266595760981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,128,0.0032117334504922234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,32,0.0032149332265059153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,32,64,0.0032586666444937387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,10240,0.22333547274271645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,16384,0.36519254048665367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,7168,0.15578346252441405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,8192,0.18452693621317545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,6144,0.1388213316599528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,5120,0.11305066744486492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,4096,0.09676799774169922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,3584,0.08120853106180827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,3072,0.06929066975911459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,2560,0.05792320171991984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,2048,0.04802560011545817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,1536,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,1024,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,768,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,512,0.014050133029619851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,128,0.0066442668437957765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,256,0.008660266796747845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,64,0.006198399762312571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,32,0.00631466656923294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,16384,0.08393279711405435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,65536,0.3412991841634115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,12288,0.05976106723149618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,10240,0.050551466147104894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,8192,0.04143786827723185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,7168,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,6144,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,5120,0.027717334032058717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,3584,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,3072,0.018147200345993042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,2560,0.015622400244077048
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,1536,0.010705066720644633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,2048,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,1024,0.008313600222269695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,768,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,512,0.0045962666471799215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,256,0.0040778666734695435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,128,0.003619199991226196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,64,0.0035818666219711304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,16384,32,0.003587199995915095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,16384,0.07093013127644857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,12288,0.052940801779429114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,65536,0.25197226206461587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,48,2560,4096,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,10240,0.045943466822306316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,8192,0.0380949338277181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,7168,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,6144,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,4096,0.020528000593185425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,5120,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,3584,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,3072,0.016296533743540446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,2560,0.013605333367983499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,2048,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,1536,0.009874133268992107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,1024,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,512,0.00489279975493749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,768,0.006212266782919565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,128,0.003942399968703588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,64,0.003537066777547201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,256,0.004088533421357473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,12288,32,0.0037280000746250153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,16384,0.06198720137278239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,12288,0.04635200103123983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,65536,0.22108160654703773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,10240,0.040141868591308597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,8192,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,7168,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,5120,0.020593067010243736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,6144,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,4096,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,3584,0.015610667069753012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,3072,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,2560,0.011694932977358501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,2048,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,1024,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,1536,0.009133866429328919
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,768,0.006082133452097575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,512,0.005266133447488149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,128,0.003991466760635376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,256,0.004074666649103165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,64,0.0035189333061377203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,10240,32,0.003643733263015747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,16384,0.05188266833623251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,12288,0.03242986599604289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,65536,0.16315627098083496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,8192,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,10240,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,7168,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,6144,0.018547199169794717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,5120,0.01589120030403137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,3584,0.012265599767367045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,4096,0.01316373348236084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,3072,0.011149866382280986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,2560,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,1536,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,2048,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,1024,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,768,0.005038933455944061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,512,0.004473599791526795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,256,0.0039818666875362395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,128,0.0035061334570248926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,32,0.003435733417669932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,8192,64,0.0032501332461833954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,16384,0.04355520009994507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,65536,0.1503338654836019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,12288,0.032425600290298465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,10240,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,8192,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,7168,0.01876266598701477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,6144,0.016910932461420693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,5120,0.014798933267593383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,4096,0.01213759978612264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,3584,0.0115146666765213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,3072,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,2560,0.009134933352470398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,2048,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,1536,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,768,0.004539733131726583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,1024,0.0054837331175804135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,512,0.004036266605059306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,256,0.0036490666369597114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,64,0.003532800078392029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,128,0.003555200000603994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,7168,32,0.003909333298603693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,12288,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,16384,0.03774826526641846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,65536,0.11943253676096599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,8192,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,7168,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,6144,0.017729065815607705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,4096,0.01146986683209737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,3584,0.010492799679438274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,3072,0.009475200374921163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,2560,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,2048,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,1536,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,768,0.004491733511288961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,1024,0.004752000172932943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,512,0.004065066576004028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,256,0.0037130666275819145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,128,0.0036245333651701607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,64,0.00322026660044988
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,6144,32,0.003365333378314972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,12288,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,16384,0.034543999036153156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,65536,0.10697387059529621
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,10240,0.023212800423304238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,8192,0.020205867290496827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,7168,0.018011732896169027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,6144,0.016293332974116007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,5120,0.014458666245142618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,3584,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,3072,0.00886079967021942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,4096,0.010637866457303365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,2560,0.008169599870840708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,2048,0.006621866424878438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,1536,0.005894400179386139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,1024,0.005268266797065735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,768,0.004740266501903534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,512,0.004387199878692627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,256,0.004019200056791306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,128,0.003634133438269297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,64,0.003173333406448364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,5120,32,0.00352960005402565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,65536,0.08874666690826416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,12288,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,16384,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,8192,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,10240,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,7168,0.014665599664052328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,6144,0.013702399532000222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,5120,0.012206932902336121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,4096,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,3584,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,3072,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,2048,0.006192000210285186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,1536,0.004937600096066793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,2560,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,1024,0.004744533201058706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,768,0.004346666733423868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,512,0.004030933231115341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,256,0.004021333406368891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,128,0.0032842665910720824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,64,0.0032543999453385672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,4096,32,0.0032437334458033243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,65536,0.07311360041300455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,12288,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,16384,0.02525866627693176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,10240,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,8192,0.014826666315396628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,7168,0.01395093301932017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,6144,0.013060266772905985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,5120,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,4096,0.010430933038393656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,3072,0.008669867118199667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,3584,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,2560,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,2048,0.006156800190607706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,1536,0.005120000243186951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,768,0.004013866682847341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,512,0.003929600119590759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,1024,0.0044938668608665465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,256,0.0036490666369597114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,128,0.0033930666744709016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,64,0.0032149332265059153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3584,32,0.0032757334411144257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,65536,0.06567466656366984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,16384,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,12288,0.017132800817489625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,10240,0.015554133057594299
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,7168,0.012846933801968894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,8192,0.013674666484196981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,6144,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,5120,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,4096,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,3072,0.007479466497898102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,3584,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,2560,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,2048,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,1536,0.0046304002404212955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,768,0.004078933348258337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,512,0.004008533308903376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,1024,0.0044053331017494205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,256,0.0036330667634805044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,128,0.003316266586383184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,64,0.003323733309904734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,3072,32,0.0034261333445707956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,65536,0.05655893484751383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,16384,0.020125865936279297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,12288,0.015473066767056783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,10240,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,7168,0.011969066659609477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,8192,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,6144,0.010990933577219645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,5120,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,4096,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,3584,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,3072,0.007283199826876323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,2560,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,2048,0.005380266904830932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,1536,0.005085866649945577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,512,0.004008533308903376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,768,0.004040533304214477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,1024,0.00446720023949941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,256,0.0036373332142829893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,128,0.0031658666829268134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,64,0.003335466732581457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2560,32,0.003201066702604294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,65536,0.0464906652768453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,16384,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,12288,0.013361066579818726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,10240,0.012070399522781373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,7168,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,8192,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,6144,0.01153600017229716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,5120,0.010286933183670044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,4096,0.00913706620534261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,3584,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,3072,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,2560,0.005861333509286245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,2048,0.005380266904830932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,1536,0.004916266600290934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,768,0.004025600105524063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,512,0.00395413339138031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,1024,0.004331733286380768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,128,0.0035434665779272715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,256,0.0035402665535608927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,64,0.0031413334111372627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,2048,32,0.003324799984693527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,65536,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,16384,0.01712426741917928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,12288,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,10240,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,8192,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,7168,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,6144,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,4096,0.008339200417200725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,5120,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,3584,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,3072,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,2048,0.0055861334005991616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,2560,0.0058218667904535925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,1536,0.004896000027656555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,1024,0.004409599800904592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,768,0.0041002665956815084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,512,0.003651199986537298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,256,0.003551999976237615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,64,0.0031541332602500914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,128,0.0032640000184377036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1536,32,0.003272533416748047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,65536,0.026281599203745527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,16384,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,12288,0.01142080028851827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,10240,0.010357333223025005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,7168,0.008999466896057129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,8192,0.009410132964452107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,6144,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,5120,0.007463466624418895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,65536,12288,0.27019945780436194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,4096,0.007463466624418895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,3584,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,3072,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,2560,0.005886933207511902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,1536,0.005612800021966299
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,2048,0.006504533191521962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,1024,0.0048096001148223875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,768,0.0043935999274253845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,512,0.003907199949026108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,256,0.00365226666132609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,128,0.0035157332817713416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,64,0.003209600100914637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,1024,32,0.0033952000240484873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,16384,0.011959466338157653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,12288,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,65536,0.027784534295399982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,10240,0.00902400016784668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,7168,0.008684800068537394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,8192,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,5120,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,6144,0.007803733150164287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,4096,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,3584,0.007464533547560374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,3072,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,2560,0.007202133536338806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,2048,0.005407999952634176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,1536,0.0046304002404212955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,1024,0.004474666714668274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,512,0.00396373321612676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,256,0.003525333354870478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,768,0.004124800115823746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,128,0.003272533416748047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,64,0.003293866664171219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,768,32,0.003260799994071325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,16384,0.009942400455474853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,65536,0.02026346723238627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,12288,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,10240,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,8192,0.008682666222254436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,6144,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,7168,0.008283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,5120,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,4096,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,3584,0.007456000149250031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,3072,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,2560,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,2048,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,1536,0.004862933357556661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,512,0.0037258667250474296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,768,0.00403413325548172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,1024,0.004411733150482178
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,256,0.0035936000446478524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,128,0.003554133325815201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,64,0.003138133386770884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,512,32,0.0032992000381151833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,65536,0.015204266707102457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,16384,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,12288,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,8192,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,10240,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,7168,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,6144,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,5120,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,3584,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,4096,0.006680533289909363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,3072,0.006266666452089946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,2560,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,2048,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,1024,0.004244266450405121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,768,0.0040287998815377556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,1536,0.004804266492525736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,512,0.0036831999818483984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,256,0.003565866748491923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,128,0.0031701333820819853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,64,0.003134933362404505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,256,32,0.003286399940649668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,16384,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,65536,0.013979732990264893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,12288,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,10240,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,8192,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,7168,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,5120,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,4096,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,6144,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,3584,0.006164266665776571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,3072,0.0065194666385650635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,2560,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,1536,0.004907733201980591
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,1024,0.004376533130804697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,768,0.004001066585381826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,512,0.0036501333117485045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,256,0.0035391998787721
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,128,0.003147733211517334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,64,0.0031445334355036415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,32,0.003270400067170461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,65536,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,16384,0.007394133508205414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,12288,0.007043200234572093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,10240,0.006466133395830791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,8192,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,7168,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,6144,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,5120,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,4096,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,3584,0.006295466423034668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,3072,0.00589333325624466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,2560,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,2048,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,1536,0.004817066589991251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,1024,0.0044821331898371375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,768,0.0039327998956044516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,512,0.0035818666219711304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,256,0.003532800078392029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,128,0.0034111998975276947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,32,0.0031541332602500914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,64,64,0.00310506671667099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,65536,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,16384,0.007042133311430614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,10240,0.006670933465162914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,12288,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,8192,0.006258133550484974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,7168,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,6144,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,5120,0.0065994665026664736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,4096,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,3584,0.006540800134340922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,3072,0.00631466656923294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,2560,0.006189866860707601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,2048,0.0057888001203536986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,1024,0.004392533500989278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,768,0.003920000046491623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,512,0.0036618667344252265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,256,0.003188266605138779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,128,0.003256533294916153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,64,0.00322026660044988
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,32,0.00317546675602595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,12288,0.21998933156331382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,16384,0.33119678497314453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,8192,0.14786559740702312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,10240,0.18432000478108723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,7168,0.1305941343307495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,6144,0.11274240016937256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,4096,0.07662826379140218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,5120,0.09574399789174398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,3072,0.058641068140665685
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,3584,0.06771946748097737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,2048,0.04116479953130086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,2560,0.0500490665435791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,1536,0.032153600454330446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,1024,0.02308053374290466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,768,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,512,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,256,0.008582400282224019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,128,0.006234666705131531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,64,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,65536,32,0.006221866607666016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,16384,0.0988864024480184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,12288,0.07051946322123209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,65536,0.3323552131652832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,10240,0.06140586535135904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,8192,0.04280426502227783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,7168,0.03734079996744792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,6144,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,5120,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,4096,0.023209599653879802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,3584,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,3072,0.01840959986050924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,2048,0.013085866967837015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,2560,0.015895467003186545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,1536,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,768,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,512,0.0041184000670909885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,256,0.003945599993069967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,128,0.003575466573238373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,64,0.0032778667906920114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,16384,32,0.0033290666838486993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,16384,0.06949439843495687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,65536,0.24418986638387047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,12288,0.05109759966532389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,8192,0.037205334504445395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,10240,0.04437439839045207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,6144,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,7168,0.03249066670735677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,5120,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,4096,0.021505065759023032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,3584,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,3072,0.017666133244832356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,2560,0.012743467092514038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,2048,0.010739200313886007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,1536,0.00960533320903778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,1024,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,768,0.00584853341182073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,512,0.004772266745567322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,256,0.0040501333773136135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,128,0.0036309334139029183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,64,0.0035573333501815797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,12288,32,0.0035562666753927866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,16384,0.06475093364715576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,65536,0.20592640240987142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,12288,0.046011734008789065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,10240,0.03925333420435588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,8192,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,7168,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,6144,0.026147200663884478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,5120,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,4096,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,3584,0.016910932461420693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,3072,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,2560,0.012914133071899415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,2048,0.010309333602587383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,1536,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,1024,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,768,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,512,0.004971733192602793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,256,0.004392533500989278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,128,0.0037162666519482933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,64,0.0034677334129810332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,10240,32,0.0034933333595593774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,16384,0.04986879825592041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,65536,0.1614506721496582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,12288,0.032153600454330446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,10240,0.028331732749938963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,8192,0.022730666399002075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,7168,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,5120,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,6144,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,4096,0.013156267007191977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,3584,0.01200320025285085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,3072,0.011105066537857056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,2560,0.009646933277448018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,2048,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,1536,0.007085866729418437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,1024,0.005474133292833964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,768,0.00405973345041275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,512,0.003923200070858002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,256,0.003587199995915095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,128,0.0036330667634805044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,64,0.003219199925661087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,8192,32,0.003222399950027466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,16384,0.0423253337542216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,65536,0.15121173858642578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,12288,0.031677865982055665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,10240,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,8192,0.02327893376350403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,6144,0.016773333152135216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,5120,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,4096,0.012266666690508524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,3584,0.011180800199508668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,3072,0.010219732920328777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,2048,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,2560,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,1536,0.006670933465162914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,1024,0.004700799783070883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,768,0.004357333481311798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,512,0.003937066594759623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,256,0.003656533360481262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,128,0.0032159999012947083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,64,0.0032543999453385672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,7168,32,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,16384,0.037137067317962645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,65536,0.12779520352681478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,12288,0.028331732749938963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,10240,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,8192,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,7168,0.01918506622314453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,6144,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,5120,0.015273599823315939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,3584,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,4096,0.011215999722480774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,3072,0.009533866246541341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,2560,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,2048,0.007353599866231282
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,1536,0.005415466427803039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,1024,0.004587733248869578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,768,0.00410453329483668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,512,0.0039594667653242745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,256,0.003571200122435888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,128,0.003504000107447306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,64,0.0032117334504922234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,6144,32,0.0033226666351159418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,16384,0.03461120128631592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,65536,0.10550613403320312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,12288,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,10240,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,8192,0.019591466585795084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,7168,0.017464532454808553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,6144,0.015614933768908181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,5120,0.014051199952761332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,4096,0.010630399982134501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,3584,0.009544533491134644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,3072,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,2560,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,2048,0.006614399949709575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,1536,0.0050346667567888895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,1024,0.004370133578777313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,768,0.004057600100835165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,512,0.0037269333998362223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,128,0.003206400076548258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,256,0.0036245333651701607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,64,0.003289599965016047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,5120,32,0.0032074667513370516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,16384,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,65536,0.08584533532460531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,12288,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,10240,0.018637865781784058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,8192,0.01562346617380778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,7168,0.014452266693115234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,6144,0.013367467125256858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,5120,0.012338133653004964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,3584,0.01120746632417043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,4096,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,3072,0.010150399804115296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,2560,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,2048,0.005714133381843567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,1536,0.004981333514054617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,1024,0.0042133331298828125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,768,0.004035199930270513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,512,0.003832533210515976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,256,0.003575466573238373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,128,0.0035157332817713416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,64,0.0032501332461833954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,4096,32,0.003553066651026408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,16384,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,65536,0.07488853136698405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,12288,0.018910932540893554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,10240,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,8192,0.014451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,7168,0.013847466309865317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,6144,0.012812800208727517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,5120,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,4096,0.011942399541536967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,3584,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,3072,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,128,2048,0.006107733150323232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,2560,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,2048,0.0054058666030565895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,1024,0.004466133316357931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,768,0.004023466755946477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,1536,0.004851200183232625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,256,0.0036245333651701607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,512,0.0036085332433382668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,128,0.0033621333539485933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,64,0.003188266605138779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3584,32,0.0033674667278925574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,16384,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,12288,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,65536,0.06232853333155314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,10240,0.015205333630243937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,8192,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,7168,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,6144,0.011751466989517212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,5120,0.010807466506958009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,4096,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,3584,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,3072,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,2048,0.0053727999329566956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,1536,0.0046304002404212955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,2560,0.006505600114663441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,1024,0.0043818667531013485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,768,0.0040448000033696495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,512,0.003953066716591517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,256,0.0036864000062147772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,128,0.003221333275238673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,64,0.0032277333239714304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,3072,32,0.0031413334111372627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,65536,0.05550080140431722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,12288,0.015304533640543619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,16384,0.019925334056218467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,8192,0.012642133235931396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,10240,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,32,32,1536,0.004781866570313772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,7168,0.01160533328851064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,6144,0.011108266313870747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,5120,0.01002346674601237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,4096,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,3584,0.009540266791979472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,3072,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,2560,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,2048,0.005690666536490122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,1024,0.004420266548792521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,768,0.004030933231115341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,1536,0.004850133260091146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,512,0.003974399964014689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,256,0.00360959991812706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,128,0.0033002667129039764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,32,0.0032927999893824257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2560,64,0.0031786667803923286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,65536,0.04539733330408732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,16384,0.015277866522471109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,12288,0.013243732849756875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,10240,0.012071466445922852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,8192,0.010785067081451416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,7168,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,6144,0.012405332922935487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,5120,0.011185066898663838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,4096,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,3584,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,3072,0.007010133564472198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,2048,0.005407999952634176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,2560,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,1024,0.004466133316357931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,1536,0.004676266511281332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,768,0.004106666644414266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,256,0.003659733384847641
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,128,0.0032810665667057036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,512,0.003752533346414566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,64,0.0031818665564060213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,2048,32,0.0031648000081380212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,65536,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,16384,0.013673599561055502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,12288,0.016771199305852254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,10240,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,8192,0.013128532965977987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,6144,0.011107200384140014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,7168,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,5120,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,4096,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,3584,0.007387733459472657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,2560,0.006155733267466227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,3072,0.006983466446399689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,2048,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,1536,0.004857600231965383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,1024,0.004408533374468485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,768,0.004101333270470301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,512,0.003861333429813385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,256,0.003532800078392029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,128,0.0035360001027584078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,32,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1536,64,0.003202133377393087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,65536,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,16384,0.014812800288200378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,12288,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,8192,0.010289067029953003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,7168,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,10240,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,6144,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,5120,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,4096,0.00786240001519521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,3584,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,2560,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,2048,0.006804266571998596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,1536,0.005756799876689911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,768,0.004390400151411692
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,1024,0.0046623999873797095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,512,0.00411520004272461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,128,0.00345920001467069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,64,0.003176533430814743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,32,0.003294933338960012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,1024,256,0.003634133438269297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,16384,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,65536,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,12288,0.01076586643854777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,10240,0.009956266482671101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,7168,0.008923733234405517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,8192,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,6144,0.008272000153859456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,5120,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,4096,0.007524266839027405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,3072,0.007111466427644093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,3584,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,2048,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,2560,0.006611200173695882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,1536,0.005317333340644837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,1024,0.004642133414745331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,768,0.0044149334232012425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,256,0.0035125332574049628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,128,0.0032042667269706728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,512,0.004016000032424927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,64,0.0032842665910720824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,768,32,0.003324799984693527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,65536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,16384,0.011526399850845337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,12288,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,10240,0.008274133503437042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,8192,0.008624000350634257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,6144,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,7168,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,5120,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,4096,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,3584,0.007383466760317485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,2560,0.0067007998625437425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,3072,0.007048533360163371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,2048,0.006267733375231425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,1536,0.004867200056711833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,1024,0.004391466577847799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,768,0.003987200061480204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,512,0.003651199986537298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,256,0.0035242666800816857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,128,0.0032629333436489105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,32,0.003189333279927572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,512,64,0.003180799881617228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,65536,0.01609280010064443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,16384,0.009262933333714803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,12288,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,8192,0.007418666779994964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,7168,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,10240,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,6144,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,5120,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,4096,0.007042133311430614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,3584,0.006607999900976817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,3072,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,2048,0.0063274666666984555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,1536,0.004850133260091146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,1024,0.004413866500059763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,768,0.004012800008058548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,512,0.0036256000399589538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,64,0.003291733314593633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,128,0.0032874666154384612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,256,0.003573333223660787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,256,32,0.003206400076548258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,65536,0.014074666301409402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,16384,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,10240,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,12288,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,8192,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,7168,0.0066431999206542965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,6144,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,5120,0.006301866471767425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,4096,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,3584,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,3072,0.0063274666666984555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,2048,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,2560,0.006201600035031637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,1024,0.0044725333650906885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,1536,0.00476800004641215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,768,0.004048000027736028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,256,0.0034688000877698263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,128,0.0031925333042939507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,512,0.0035594666997591654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,64,0.0031114667654037476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,128,32,0.003236266722281774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,65536,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,16384,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,12288,0.006705066561698914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,10240,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,8192,0.006263466676076253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,6144,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,7168,0.006605866551399231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,5120,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,4096,0.0057888001203536986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,3584,0.006295466423034668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,2560,0.006632533172766368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,3072,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,2048,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,1536,0.0047189335028330484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,1024,0.004413866500059763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,768,0.004014933357636133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,256,0.003253333270549774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,512,0.003570133447647095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,128,0.003256533294916153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,32,0.0031338666876157125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,64,64,0.0028757333755493166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,65536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,16384,0.007043200234572093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,12288,0.006704000135262807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,8192,0.005757866799831391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,7168,0.007111466427644093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,6144,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,5120,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,4096,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,3584,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,3072,0.005781333148479462
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,2560,0.006259199976921081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,2048,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,1536,0.004789333542188009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,1024,0.004456533491611481
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,768,0.003978666663169861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,256,0.0034933333595593774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,512,0.0034613333642482757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,128,0.0032287999987602235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,64,0.003311999887228012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,32,0.0031040000418821974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,10240,0.20626773834228515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,16384,0.33488105138142904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,12288,0.2430037339528402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,8192,0.14718292554219564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,7168,0.1300821304321289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,6144,0.11201173464457195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,4096,0.07598079840342203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,5120,0.09523093700408936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,3584,0.06707200209299723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,2560,0.049561599890391037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,3072,0.05816320180892944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,2048,0.040482131640116374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,768,0.018413867553075156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,1536,0.031880533695220946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,512,0.013427199920018515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,256,0.008553600311279297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,128,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,64,0.005789866546789805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,32,0.005814399818579356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,16384,0.09683519999186198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,65536,0.32880640029907227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,12288,0.0691210667292277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,10240,0.05942720174789429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,8192,0.04973440170288086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,7168,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,6144,0.031675734122594196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,5120,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,4096,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,3584,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,3072,0.018003199497858682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,2560,0.015553067127863566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,2048,0.013223466277122498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,1536,0.010705066720644633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,1024,0.0086816002925237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,512,0.0045855998992919925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,256,0.003918933371702829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,128,0.0036170666416486105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,64,0.003253333270549774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,32,0.003504000107447306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,65536,0.2387989362080892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,16384,0.07188586393992105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,12288,0.05058559974034628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,10240,0.04396373430887858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,8192,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,7168,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,6144,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,5120,0.02525866627693176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,4096,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,3584,0.019434666633605956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,3072,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,2560,0.015464533368746439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,1536,0.008992000420888265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,1024,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,768,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,512,0.003952000041802724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,256,0.003610666592915853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,128,0.003553066651026408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,64,0.003302400062481562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,12288,32,0.0034154665966828666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,65536,0.20264959335327148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,16384,0.062259201208750406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,12288,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,10240,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,8192,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,7168,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,6144,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,3584,0.017717333634694417
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,3072,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,2560,0.012471466263135274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,2048,0.010866133371988933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,1536,0.008992000420888265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,1024,0.006770133475462596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,768,0.0054730668663978575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,512,0.004962133367856344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,256,0.0036778666079044344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,128,0.0036085332433382668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,64,0.0032255999743938447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,10240,32,0.0032992000381151833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,65536,0.16179413795471193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,16384,0.05048213402430216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,12288,0.032085333267847696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,10240,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,8192,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,6144,0.01827733318010966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,5120,0.01588586668173472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,4096,0.012882133324941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,3584,0.011991467078526814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,3072,0.010957866907119751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,2560,0.009763200084368389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,2048,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,1536,0.007272533575693766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,1024,0.004615466793378194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,768,0.00417493333419164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,512,0.0039893334110577905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,256,0.0037418665985266366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,128,0.0035114665826161706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,64,0.0031829332311948144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,8192,32,0.0035285333792368567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,65536,0.1421994686126709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,16384,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,12288,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,10240,0.02744320034980774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,8192,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,6144,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,5120,0.014658133188883463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,4096,0.012119467059771221
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,3584,0.011471999684969585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,3072,0.010219732920328777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,2560,0.009193600217501322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,2048,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,1536,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,1024,0.004691199958324432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,768,0.003993600110212962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,512,0.003931733220815659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,256,0.003770666569471359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,128,0.0032127998769283296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,64,0.0032170665760835014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,7168,32,0.0032106667757034303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,65536,0.12404053211212158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,16384,0.03891199827194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,12288,0.02949013312657674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,10240,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,8192,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,7168,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,6144,0.01718399922053019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,5120,0.015409066279729208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,4096,0.011368532975514729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,3584,0.010377599795659383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,3072,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,2560,0.008714666962623597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,2048,0.007146666447321574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,1536,0.005849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,1024,0.0047199999292691554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,768,0.003942399968703588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,512,0.0039893334110577905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,256,0.0035434665779272715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,128,0.003562666724125544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,64,0.00317546675602595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,6144,32,0.003201066702604294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,65536,0.10369706948598226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,16384,0.03372373183568318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,12288,0.025571199258168538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,10240,0.02191466689109802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,8192,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,7168,0.017182934284210204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,6144,0.015613866845766702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,5120,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,4096,0.010685867071151734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,3584,0.00976213316122691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,3072,0.008990933497746784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,2560,0.00803306649128596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,2048,0.006589866677920024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,1536,0.0054400001962979635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,1024,0.004434133569399515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,768,0.0040949332217375435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,512,0.003918933371702829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,256,0.0036629334092140196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,128,0.0035285333792368567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,64,0.003230933348337809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,65536,1024,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,5120,32,0.0033589333295822145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,16384,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,65536,0.08386560281117758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,12288,0.021093332767486574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,10240,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,8192,0.015545599659283958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,7168,0.014450132846832275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,6144,0.01349440018335978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,5120,0.012061867117881774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,4096,0.01090239981810252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,3584,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,3072,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,2560,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,2048,0.007796266674995422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,1536,0.006428800026575724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,768,0.004621866842110952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,1024,0.005438933273156484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,512,0.004392533500989278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,256,0.00360000009338061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,128,0.0032543999453385672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,64,0.0031957333286603295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,4096,32,0.003270400067170461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,65536,0.07331840197245279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,16384,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,12288,0.018478933970133463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,10240,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,16384,768,0.0070154666900634766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,8192,0.014313600460688271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,7168,0.013699199755986533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,6144,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,5120,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,4096,0.01067200005054474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,3584,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,2560,0.008237866560618083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,3072,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,2048,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,1536,0.006188799937566122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,1024,0.005221333106358846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,768,0.004762666424115499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,512,0.004905599852403005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,256,0.0036501333117485045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,64,0.003171200056870779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,32,0.003257599969704946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,16384,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,65536,0.06372586488723755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,12288,0.016839466492335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,10240,0.015204266707102457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,8192,0.01325653294722239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,7168,0.012333866953849793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,6144,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,5120,0.010831999778747558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,4096,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,3584,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,3072,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,2560,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,2048,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,1536,0.006190933287143707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,1024,0.005362133185068766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,768,0.004655999938646952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,256,0.004005333284536997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,512,0.0043818667531013485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,128,0.0032618666688601174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,64,0.003239466746648153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3072,32,0.003209600100914637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,65536,0.054579198360443115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,16384,0.01997973322868347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,12288,0.015131733814875283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,10240,0.01397119959195455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,8192,0.012423466642697651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,7168,0.011618133385976155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,6144,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,5120,0.009966933727264404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,4096,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,3584,0.007964799801508587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,3072,0.008138666550318401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,2560,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,2048,0.006293333570162455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,1536,0.006192000210285186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,1024,0.005308799942334493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,768,0.004554666578769684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,512,0.004175999760627746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,256,0.004043733328580856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,128,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,64,0.0032490665713946023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2560,32,0.003188266605138779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,65536,0.04478293259938558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,16384,0.015339733163515726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,12288,0.012949333588282267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,10240,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,8192,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,7168,0.010762666662534077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,6144,0.009942400455474853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,5120,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,4096,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,3584,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,3072,0.006705066561698914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,2560,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,2048,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,1536,0.005865600208441416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,1024,0.005050666630268097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,768,0.0048767998814582825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,512,0.004045866678158442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,256,0.0036906667053699495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,128,0.00360000009338061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,64,0.003302400062481562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,2048,32,0.0032586666444937387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,65536,0.03508906761805217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,16384,0.013562666376431784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,12288,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,10240,0.014999467134475707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,8192,0.012355200449625651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,7168,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,6144,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,5120,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,4096,0.00820479989051819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,3584,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,2560,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,3072,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,2048,0.0062613333264986675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,1536,0.005438933273156484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,1024,0.004840533435344696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,768,0.004308266441027323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,512,0.003993600110212962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,256,0.0035466666022936503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,128,0.0035797332723935447
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,64,0.003092266619205475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1536,32,0.0034272000193595886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,65536,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,16384,0.014517333110173544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,12288,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,10240,0.011108266313870747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,8192,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,7168,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,6144,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,5120,0.007524266839027405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,4096,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,3584,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,3072,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,2560,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,2048,0.006632533172766368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,1536,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,1024,0.004910933474699656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,768,0.004369066655635833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,512,0.004063999901215235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,256,0.0038922667503356934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,128,0.00352960005402565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,64,0.00323840007185936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,1024,32,0.0031776001056035364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,65536,0.0211626668771108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,16384,0.012880000472068786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,12288,0.010969600081443787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,10240,0.009876267115275065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,8192,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,7168,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,6144,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,5120,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,4096,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,3584,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,3072,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,2560,0.007043200234572093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,2048,0.005400533477465311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,1536,0.005067733426888784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,1024,0.004625066618124644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,768,0.004286933441956838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,512,0.003958400090535482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,256,0.0035061334570248926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,128,0.0035455999275048576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,64,0.0032469332218170166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,768,32,0.0031914666295051576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,65536,0.022984532515207927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,16384,0.01146986683209737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,12288,0.00909440020720164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,10240,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,8192,0.008339200417200725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,7168,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,6144,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,5120,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,4096,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,3584,0.007114666700363159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,3072,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,2560,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,2048,0.006279466549555461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,1536,0.004710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,1024,0.004353066782156626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,768,0.004065066576004028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,512,0.0037205333511034647
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,256,0.0036320000886917113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,128,0.0032650666932264962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,64,0.0032405334214369455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,512,32,0.0032511999209721885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,65536,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,16384,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,12288,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,10240,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,8192,0.007041066884994507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,7168,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,6144,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,5120,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,4096,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,3584,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,3072,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,2560,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,2048,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,1536,0.004849066833655039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,1024,0.004335999985535939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,768,0.004067199925581614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,512,0.003651199986537298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,256,0.003651199986537298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,128,0.0032640000184377036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,64,0.003294933338960012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,256,32,0.0032106667757034303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,65536,0.014107732971509298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,16384,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,12288,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,10240,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,8192,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,7168,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,6144,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,5120,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,4096,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,3584,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,3072,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,2560,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,1536,0.004676266511281332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,2048,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,1024,0.004049066702524821
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,768,0.00402453343073527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,512,0.0036277333895365395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,256,0.003502933432658514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,128,0.0032117334504922234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,64,0.0031957333286603295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,128,32,0.0031637333333492277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,65536,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,16384,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,12288,0.006908800204594929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,10240,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,8192,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,7168,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,6144,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,5120,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,4096,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,3584,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,3072,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,2560,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,2048,0.006221866607666016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,1536,0.00477866679430008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,1024,0.004315733412901561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,768,0.0039434666434923805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,512,0.0037791999677817024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,256,0.0032287999987602235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,128,0.003269333392381668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,64,0.0031541332602500914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,64,32,0.003230933348337809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,16,32,10240,0.006266666452089946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,65536,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,16384,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,10240,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,8192,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,12288,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,7168,0.006287999947865804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,6144,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,5120,0.005939200023810069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,4096,0.005493333439032236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,3584,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,3072,0.005750399827957153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,2560,0.005851733187834421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,2048,0.005849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,1024,0.00417493333419164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,768,0.004012800008058548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,1536,0.004756266872088114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,512,0.0036138666172822317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,256,0.003570133447647095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,128,0.003239466746648153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,64,0.003091199944416682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,32,32,0.003278933217128118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,10240,0.20237439473470054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,12288,0.24021973609924316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,16384,0.32771412531534827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,8192,0.16561493873596192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,7168,0.1458175977071126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,6144,0.12840960025787354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,4096,0.08144213358561198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,5120,0.10857280095418294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,3584,0.07081706523895263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,3072,0.061610666910807285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,2560,0.05239466826121012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,2048,0.041988265514373777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,1024,0.02362026572227478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,1536,0.03338239987691243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,768,0.01841920018196106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,256,0.008759466807047527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,512,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,128,0.006201600035031637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,64,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,65536,32,0.006132266422112783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,12288,0.06775573094685873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,16384,0.09495893319447836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,10240,0.058606934547424314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,8192,0.04952746629714966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,65536,0.32624638875325523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,6144,0.032017066081364946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,7168,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,5120,0.02791999975840251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,4096,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,3584,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,3072,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,2048,0.013255467017491659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,2560,0.01564479966958364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,768,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,1024,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,1536,0.010921600461006164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,512,0.004677333434422811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,256,0.004021333406368891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,128,0.0036309334139029183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,64,0.0033557333052158357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,16384,32,0.0035562666753927866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,16384,0.07167999744415283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,12288,0.052292267481486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,10240,0.04498773415883382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,8192,0.038024532794952395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,65536,0.23490559260050453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,7168,0.033587201436360674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,6144,0.028875732421875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,5120,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,8,3584,128,0.0033226666351159418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,4096,0.02209706703821818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,3584,0.019435733556747437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,3072,0.017598932981491087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,2048,0.010968533158302308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,2560,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,1536,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,1024,0.007086933155854543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,768,0.005339733262856802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,256,0.0036330667634805044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,512,0.004337066908677419
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,64,0.0032661333680152893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,32,0.003319466610749563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,12288,128,0.003626666714747747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,16384,0.06103039979934692
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,12288,0.04396373430887858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,10240,0.03809279998143514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,65536,0.197324800491333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,8192,0.03174399932225545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,7168,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,5120,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,6144,0.025653332471847534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,4096,0.018755199511845906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,3584,0.01781866749127706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,3072,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,2560,0.011935999989509583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,2048,0.011447466413180033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,1536,0.008921600381533305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,1024,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,512,0.005099733173847198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,256,0.003700266778469086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,768,0.006164266665776571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,128,0.0035232000052928926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,64,0.0032618666688601174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,10240,32,0.003606399893760681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,16384,0.048401065667470294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,12288,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,10240,0.027716267108917236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,65536,0.1591978708902995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,8192,0.023140267531077067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,6144,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,5120,0.016302933295567833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,3584,0.012332800030708312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,4096,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,3072,0.011210667093594869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,2048,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,1536,0.007156266768773396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,2560,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,1024,0.004996266464392344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,768,0.004454400142033895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,512,0.004010666658480962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,128,0.0035690667728583017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,256,0.003549866626660029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,64,0.003218133250872294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,8192,32,0.003236266722281774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,16384,0.0423253337542216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,12288,0.03297599951426188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,10240,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,65536,0.14076587359110515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,7168,0.021826134125391642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,8192,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,6144,0.016851200660069784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,5120,0.014455466469128927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,4096,0.01267413298288981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,2560,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,3072,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,3584,0.011557333668073018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,2048,0.0081045334537824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,1536,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,1024,0.004628266890843709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,768,0.004385066529115042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,512,0.004041599979003271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,256,0.0035978667438030243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,128,0.003385599950949351
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,32,0.0031648000081380212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,7168,64,0.003257599969704946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,16384,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,12288,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,65536,0.12284586429595948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,10240,0.025396267573038738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,8192,0.020808533827463786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,7168,0.019639466206232706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,6144,0.017181867361068727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,5120,0.015552000204722086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,4096,0.01118293305238088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,3584,0.01042560040950775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,3072,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,2048,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,1536,0.005678933362166087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,2560,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,1024,0.004515199859937032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,512,0.003984000037113826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,768,0.0040522667268912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,256,0.00360959991812706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,128,0.0032437334458033243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,64,0.0032885332902272543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,6144,32,0.0033749334514141084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,16384,0.03392746845881144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,12288,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,10240,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,65536,0.10274133682250977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,8192,0.019368533293406168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,7168,0.017593600352605186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,6144,0.015620266397794088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,5120,0.014014933506647745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,4096,0.010665599505106609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,3584,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,3072,0.00886293351650238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,2048,0.006361599763234456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,1536,0.004997333387533823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,2560,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,1024,0.004327466587225596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,768,0.004410666724046072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,512,0.0039818666875362395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,128,0.0032416000962257386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,256,0.0035594666997591654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,32,0.003271466741959254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,16384,0.028602667649586994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,12288,0.02225386699040731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,65536,0.08564053376515707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,8192,0.0162282665570577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,7168,0.014939733346303306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,10240,0.019035732746124266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,6144,0.013699199755986533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,5120,0.012345600128173827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,4096,0.01125333309173584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,3584,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,3072,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,2560,0.008727467060089112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,2048,0.007524266839027405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,1536,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,768,0.004689066608746847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,1024,0.006007466713587443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,512,0.0044383997718493145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,256,0.0035807999471823373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,64,0.00311253344019254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,128,0.0031914666295051576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,4096,32,0.0032000000278155005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,16384,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,65536,0.07581013043721517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,12288,0.01945599913597107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,7168,0.013699199755986533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,8192,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,10240,0.016711467504501344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,6144,0.012573867042859396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,5120,0.011796266833941142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,4096,0.010774399836858113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,3584,0.01076693336168925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,3072,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,2560,0.008521599570910136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,2048,0.007045333087444305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,1536,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,768,0.005190399785836538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,1024,0.0054837331175804135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,512,0.0058559998869895935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,256,0.00360959991812706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,64,0.003186133255561193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,128,0.003328000009059906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3584,32,0.0033130665620168054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,65536,0.06573973496754965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,16384,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,12288,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,10240,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,7168,0.012812800208727517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,8192,0.013434666395187377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,5120,0.01083626647790273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,6144,0.011526399850845337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,4096,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,3584,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,3072,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,2560,0.007701333363850911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,2048,0.0063296000162760425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,1536,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,768,0.004711466530958811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,512,0.004540800054868063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,1024,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,256,0.0039488000174363455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,128,0.0031328000128269195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,64,0.0030954666435718536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,3072,32,0.0031957333286603295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,65536,0.05812906821568807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,16384,0.02026346723238627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,12288,0.015476266543070475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,10240,0.01425386667251587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,7168,0.011548800269762675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,8192,0.01269760032494863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,6144,0.010854400197664897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,5120,0.010220799843470256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,4096,0.008932266632715862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,3072,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,3584,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,2048,0.006297599772612255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,2560,0.0076682666937510175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,1536,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,1024,0.005118933320045471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,512,0.004515199859937032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,768,0.005169066786766052
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,256,0.003962666789690653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,128,0.0032768001159032187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,64,0.003142400085926056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2560,32,0.003206400076548258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,65536,0.048742401599884036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,12288,0.013150933384895324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,16384,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,10240,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,8192,0.011550933122634888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,7168,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,6144,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,5120,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,4096,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,3584,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,3072,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,1536,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,2048,0.006950399776299794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,2560,0.006234666705131531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,1024,0.00496319979429245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,768,0.00452693353096644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,512,0.00448639988899231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,256,0.003994666785001755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,128,0.0035274667044480645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,64,0.0032074667513370516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,2048,32,0.0032661333680152893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,65536,0.035499731699625656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,12288,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,16384,0.013877333203951518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,10240,0.014662399888038635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,8192,0.013597866892814637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,7168,0.011741866668065388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,6144,0.011059199770291645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,5120,0.008137600123882293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,3584,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,4096,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,3072,0.006671999891599019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,2560,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,1536,0.005406933526198069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,2048,0.006382933259010315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,1024,0.004711466530958811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,768,0.004379733403523763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,512,0.0040778666734695435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,128,0.003517866631348928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,64,0.003239466746648153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,32,0.003306666761636734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,16384,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,65536,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,12288,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,10240,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,8192,0.010152533650398254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,6144,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,7168,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,5120,0.007457066575686138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,4096,0.007461333274841308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,3584,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,3072,0.0066442668437957765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,2560,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,1536,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,2048,0.00664213349421819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,1024,0.004653866589069367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,768,0.0049098665515581764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,512,0.004387199878692627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,256,0.0036864000062147772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,128,0.0035807999471823373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,32,0.0032458665470282235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1024,64,0.0032458665470282235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,65536,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,16384,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,12288,0.010834133625030518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,10240,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,8192,0.00947093367576599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,6144,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,7168,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,5120,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,4096,0.007462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,3584,0.007147733370463054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,3072,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,2560,0.006568533182144165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,1536,0.005407999952634176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,2048,0.005346133311589559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,1024,0.00481279989083608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,768,0.004474666714668274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,512,0.003987200061480204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,256,0.0035391998787721
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,128,0.0035264000296592714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,32,0.003236266722281774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,768,64,0.0031744000812371576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,65536,0.024851200977961223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,16384,0.011538133025169373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,12288,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,10240,0.008212266862392426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,8192,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,6144,0.007441066702206929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,5120,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,4096,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,3584,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,3072,0.006737066805362702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,2560,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,2048,0.0062613333264986675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,1536,0.004647466540336609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,1024,0.004145066688458125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,768,0.003787733366092046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,512,0.0037802666425704955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,256,0.0036608000596364343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,128,0.0032746667663256326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,64,0.0031178665657838186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,32,0.003289599965016047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,65536,0.01628373364607493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,16384,0.008719999591509502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,12288,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,10240,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,8192,0.007218133409818013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,7168,0.00697813332080841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,6144,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,5120,0.006259199976921081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,4096,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,3584,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,3072,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,2560,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,2048,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,1536,0.004654933512210846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,1024,0.004197333256403605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,768,0.003857066730658213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,512,0.003568000098069509
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,256,0.0035743998984495797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,128,0.0031968000034491217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,64,0.0031744000812371576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,256,32,0.0032138665517171226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,65536,0.014166399836540222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,16384,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,12288,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,10240,0.007418666779994964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,8192,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,7168,0.006667733192443848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,6144,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,5120,0.0061930666367212926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,4096,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,3584,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,3072,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,2560,0.006189866860707601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,2048,0.005816533168156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,1536,0.004554666578769684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,1024,0.00412266676624616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,768,0.003957333415746689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,512,0.0036650667587916053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,256,0.0031680000325044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,128,0.0031413334111372627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,64,0.0031306666632493338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,128,32,0.003125333289305369
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,65536,0.010786133011182149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,16384,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,12288,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,10240,0.006295466423034668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,8192,0.006600533425807953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,7168,0.0062613333264986675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,6144,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,5120,0.005851733187834421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,4096,0.00547626664241155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,3584,0.0061930666367212926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,3072,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,2560,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,2048,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,1536,0.004520533482233683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,1024,0.004178133110205332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,768,0.003916800022125244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,512,0.00360000009338061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,256,0.0032287999987602235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,128,0.0031583999594052637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,64,0.0030933332939942675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,64,32,0.003101866692304611
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,65536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,16384,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,12288,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,10240,0.00660159985224406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,5120,64,0.003236266722281774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,8192,0.005475200215975444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,7168,0.006485333542029063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,6144,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,5120,0.005883733431498209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,4096,0.005525333185990652
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,3584,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,3072,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,2560,0.006156800190607706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,2048,0.005782400071620941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,1536,0.004885333279768625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,1024,0.004019200056791306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,768,0.004057600100835165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,512,0.003735466549793879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,256,0.003583999971548716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,128,0.003268266717592875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,64,0.0032373333970705668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,32,32,0.002855466554562251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,12288,0.23811413447062174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,16384,0.32957865397135416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,8192,0.16513706843058268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,10240,0.2006378650665283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,6144,0.12673707008361818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,7168,0.1435647964477539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,4096,0.09059306780497232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,5120,0.10715093612670898
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,3584,0.07075733343760172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,3072,0.06161173184712728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,2560,0.05215573310852051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,2048,0.042530135313669844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,1024,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,1536,0.03324586749076843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,768,0.018910932540893554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,512,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,128,0.006192000210285186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,256,0.009125333031018574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,32,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,65536,64,0.0058773333827654515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,16384,0.09574399789174398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,12288,0.0676522652308146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,65536,0.3268927892049154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,10240,0.058265598615010586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,8192,0.048844798405965166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,7168,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,6144,0.032017066081364946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,5120,0.02757866581281026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,4096,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,3584,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,3072,0.01806933283805847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,2560,0.015681067109107973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,2048,0.013362133502960205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,1536,0.011037866274515789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,1024,0.00844373305638631
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,512,0.004621866842110952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,768,0.006737066805362702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,256,0.0039711999396483105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,128,0.003610666592915853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,64,0.003221333275238673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,16384,32,0.0034815999368826545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,16384,0.06901760101318359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,12288,0.051575465997060144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,65536,0.2338816006978353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,10240,0.0443061351776123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,8192,0.037886933485666914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,7168,0.03317866722742717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,6144,0.030584534009297688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,5120,0.02587413390477498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,4096,0.02300693392753601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,3584,0.01998400092124939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,3072,0.018207999070485432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,1536,256,0.0036469332873821257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,2560,0.016156799594561257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,2048,0.010800000031789143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,1536,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,1024,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,768,0.005064533154169718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,512,0.004407466451327006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,256,0.003969066590070724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,128,0.003575466573238373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,64,0.00323840007185936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,12288,32,0.0033791999022165934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,16384,0.059596800804138185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,12288,0.04348586797714234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,65536,0.19616427421569824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,10240,0.037887998421986896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,8192,0.03140160044034322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,7168,0.029764266808827718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,6144,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,5120,0.022529067595799764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,4096,0.0191648006439209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,3584,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,3072,0.01588266690572103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,2560,0.012810666362444559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,1536,0.009022933244705201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,2048,0.011524266997973124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,1024,0.007456000149250031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,768,0.006189866860707601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,512,0.005036800106366476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,256,0.003607466568549474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,128,0.0036469332873821257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,64,0.0032042667269706728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,10240,32,0.00352960005402565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,16384,0.049356798330942794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,12288,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,65536,0.15906133651733398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,10240,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,8192,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,6144,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,5120,0.016361600160598753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,4096,0.013665067156155905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,3584,0.01234346628189087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,3072,0.011485866705576579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,2560,0.009947733084360758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,1536,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,2048,0.008999466896057129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,1024,0.005120000243186951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,768,0.004605866471926371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,512,0.0040277334551016486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,256,0.0036608000596364343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,128,0.0036703998843828833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,64,0.003235200047492981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,8192,32,0.0033141332368055976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,16384,0.04177920023600261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,12288,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,65536,0.13875093460083007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,10240,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,8192,0.023959465821584067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,7168,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,6144,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,5120,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,4096,0.01267519990603129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,3584,0.01128426690896352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,3072,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,2560,0.009196799993515015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,2048,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,1536,0.006226133306821187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,1024,0.004996266464392344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,768,0.004423466821511587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,512,0.004105599969625473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,256,0.003636266787846883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,4,512,7168,0.00790826678276062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,128,0.0032842665910720824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,64,0.003269333392381668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,7168,32,0.0032000000278155005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,12288,0.02983573277791341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,16384,0.03870933453241984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,10240,0.025548799832661943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,65536,0.12004693349202473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,8192,0.021895466248194377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,6144,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,7168,0.02013333241144816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,3584,0.010423466563224792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,4096,0.011517866452534994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,3072,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,2560,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,2048,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,1536,0.005544533332188925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,1024,0.0047423998514811196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,512,0.003917866696914038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,256,0.0034858666360378264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,128,0.0032799998919169106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,768,0.004439466694990794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,64,0.003310933212439219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,6144,32,0.0031914666295051576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,16384,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,65536,0.10216106573740642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,12288,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,10240,0.02271359960238139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,6144,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,8192,0.019718400637308755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,7168,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,5120,0.01441493332386017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,4096,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,3072,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,2560,0.007589333256085714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,3584,0.009884799520174663
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,2048,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,1536,0.005039999882380167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,1024,0.004204800228277842
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,768,0.004387199878692627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,512,0.003985066711902618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,256,0.0035946667194366455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,128,0.0035562666753927866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,32,0.003257599969704946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,5120,64,0.003066666672627131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,16384,0.027989333868026732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,65536,0.08502613703409831
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,12288,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,10240,0.01930560072263082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,8192,0.01646506687005361
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,7168,0.014802133043607077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,6144,0.013802666465441385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,4096,0.011400533715883891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,5120,0.012344533205032348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,3072,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,3584,0.011332266529401143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,2560,0.009979733824729919
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,2048,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,1536,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,1024,0.005835733314355215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,768,0.005365333457787832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,256,0.003568000098069509
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,128,0.003269333392381668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,512,0.00447573314110438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,64,0.003260799994071325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,4096,32,0.0033759998778502146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,12288,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,16384,0.02362026572227478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,65536,0.0752288023630778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,10240,0.01690666675567627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,8192,0.014929067095120749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,6144,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,5120,0.012197333574295043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,7168,0.014492799838383993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,4096,0.010493866602579753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,3584,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,3072,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,2560,0.009101866682370504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,2048,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,1024,0.005678933362166087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,1536,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,768,0.00494400014479955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,512,0.0061141331990559895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,256,0.0035466666022936503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,128,0.0031829332311948144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,32,0.0032106667757034303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3584,64,0.0031946666538715364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,16384,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,65536,0.06533226569493612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,12288,0.01731626590092977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,8192,0.0139957328637441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,10240,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,7168,0.012742400169372559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,6144,0.011858133474985759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,5120,0.011059199770291645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,3584,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,4096,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,3072,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,2560,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,2048,0.0073183998465538025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,1536,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,1024,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,512,0.004519466559092204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,768,0.005003733436266581
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,128,0.0032170665760835014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,256,0.003956266740957896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,64,0.0034741332133611047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,3072,32,0.0032490665713946023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,12288,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,65536,0.058574934800465904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,10240,0.013844266533851624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,16384,0.02046826680501302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,8192,0.012607999642690024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,7168,0.011958400408426922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,6144,0.010854400197664897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,5120,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,4096,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,3584,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,3072,0.00831573357184728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,2560,0.008213333288828532
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,2048,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,1536,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,1024,0.005380266904830932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,512,0.0044821331898371375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,768,0.004856533308823904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,256,0.0038954667747020722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,128,0.0032490665713946023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,64,0.0033098667860031127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2560,32,0.003230933348337809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,16384,0.015827199816703795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,65536,0.048395733038584396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,12288,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,7168,0.010558933019638062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,8192,0.011290666460990906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,10240,0.012288000186284382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,6144,0.00960533320903778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,5120,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,4096,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,3072,0.0072170664866765336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,3584,0.007771733403205872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,2560,0.006702933212121327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,2048,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,1536,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,1024,0.005599999924500784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,768,0.005278933544953664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,512,0.004394666850566864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,256,0.004051200052102407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,64,0.0032426667710145317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,128,0.0034976000587145484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,2048,32,0.003201066702604294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,65536,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,16384,0.014267733693122864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,10240,0.014596266547838846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,12288,0.011730133493741354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,8192,0.01308799982070923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,7168,0.011585066715876263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,6144,0.01097813347975413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,4096,0.007894399762153625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,5120,0.0074986666440963745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,3584,0.007445333401362102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,3072,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,2560,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,2048,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,1536,0.005774933099746704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,768,0.004409599800904592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,1024,0.005120000243186951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,256,0.00377813329299291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,512,0.004041599979003271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,128,0.0035861333211263022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,64,0.0031189332405726117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1536,32,0.0032650666932264962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,16384,0.014381866653760275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,12288,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,65536,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,10240,0.010935466488202412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,8192,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,7168,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,6144,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,5120,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,4096,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,3584,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,2560,0.005843199789524078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,2048,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,3072,0.0066101332505544026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,1536,0.0066431999206542965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,1024,0.005460266768932342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,768,0.004648533463478088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,512,0.004430933296680451
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,256,0.0036864000062147772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,128,0.003869866579771042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,64,0.0033759998778502146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,1024,32,0.0032821332414944967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,16384,0.012870400150616964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,65536,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,10240,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,8192,0.009124267101287841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,7168,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,5120,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,4096,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,6144,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,3584,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,3072,0.006676266590754191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,2560,0.006676266590754191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,2048,0.005593599875768026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,1536,0.005784533421198527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,1024,0.004795733094215393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,768,0.0044064000248909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,512,0.003944533318281174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,128,0.003554133325815201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,256,0.00363520011305809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,64,0.003190399954716364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,32,0.003256533294916153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,16384,0.011047466595967611
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,65536,0.024100265900293984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,12288,0.009092266360918682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,10240,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,8192,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,7168,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,6144,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,4096,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,5120,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,3584,0.007086933155854543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,3072,0.00727040022611618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,2560,0.006263466676076253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,2048,0.006268799801667531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,1536,0.005235200126965841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,1024,0.00447573314110438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,768,0.0040224000811576845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,512,0.003902933249870936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,128,0.003176533430814743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,64,0.0032149332265059153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,256,0.0035573333501815797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,512,32,0.003219199925661087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,65536,0.015270400047302245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,16384,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,12288,0.008259200056393941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,10240,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,8192,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,6144,0.006701866785685222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,7168,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,5120,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,4096,0.006668800115585327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,3584,0.006233599781990051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,2560,0.006292266647020976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,2048,0.005824000140031179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,3072,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,1536,0.004822400212287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,1024,0.004362666606903076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,768,0.003958400090535482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,512,0.0037258667250474296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,256,0.003366400053103765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,128,0.0032245332996050516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,64,0.0032170665760835014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,256,32,0.0031615999837716425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,16384,0.008102400104204814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,65536,0.013585066795349121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,12288,0.007463466624418895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,10240,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,8192,0.006676266590754191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,7168,0.0066442668437957765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,6144,0.0066336000959078475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,4096,0.0057536001006762184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,5120,0.005894400179386139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,3584,0.0062165334820747375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,3072,0.005755733450253805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,2560,0.006167466441790262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,2048,0.005847466488679251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,1536,0.004766933123270671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,768,0.003960533440113068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,1024,0.004060799876848856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,512,0.003688533355792364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,256,0.0034944000343481696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,128,0.003260799994071325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,64,0.0031146667897701263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,128,32,0.0031914666295051576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,16384,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,65536,0.010705066720644633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,12288,0.006634666522343953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,10240,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,7168,0.006222933530807495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,8192,0.006609066824118296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,6144,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,5120,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,4096,0.005562666555245717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,3584,0.00592853327592214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,3072,0.005883733431498209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,2560,0.006247466802597046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,1536,0.004861866434415182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,2048,0.0055861334005991616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,768,0.004019200056791306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,512,0.003571200122435888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,1024,0.004010666658480962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,256,0.0035829332967599234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,128,0.003115733216206233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,64,0.0030965333183606463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,64,32,0.003542399903138479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,65536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,16384,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,12288,0.006258133550484974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,10240,0.005858133236567179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,8192,0.005791999896367391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,7168,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,6144,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,4096,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,5120,0.005755733450253805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,3584,0.005790933469931285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,3072,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,2048,0.0057888001203536986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,2560,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,1536,0.004926933348178864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,1024,0.0040618665516376495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,768,0.003955200066169103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,512,0.0036149332920710243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,256,0.003176533430814743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,64,0.0031989333530267083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,128,0.0032032000521818793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,32,32,0.0028959999481836954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,10240,0.20135253270467124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,12288,0.2359989325205485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,16384,0.33105812072753904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,8192,0.16377174059549968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,7168,0.14315306345621745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,6144,0.12625919977823893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,5120,0.10618986288706463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,3584,0.07205653190612793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,4096,0.08755199909210205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,3072,0.062498132387797035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,2560,0.052738134066263834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,2048,0.04225706656773885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,1024,0.023484800259272257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,1536,0.03400426705678304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,768,0.01835093299547831
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,512,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,256,0.008931199709574383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,128,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,64,0.005942399799823761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,65536,32,0.005789866546789805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,12288,0.06652586857477824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,16384,0.09403626918792725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,8192,0.048434134324391684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,10240,0.05768640041351318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,65536,0.3246080080668131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,6144,0.032017066081364946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,7168,0.03877333402633667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,5120,0.027989333868026732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,3584,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,4096,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,3072,0.018143999576568603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,2560,0.01636373301347097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,2048,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,768,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,1536,0.010713600118954976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,512,0.004690133531888326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,256,0.003930666546026865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,128,0.003589333345492681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,64,0.0036415999134381616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,16384,32,0.0032074667513370516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,12288,0.051438931624094644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,65536,0.23313280741373696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,10240,0.04410133361816406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,7168,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,8192,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,6144,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,5120,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,4096,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,3584,0.01978666583697001
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,3072,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,2560,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,2048,0.010705066720644633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,1024,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,1536,0.009136000275611877
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,768,0.004971733192602793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,512,0.004340266684691111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,256,0.003739733248949051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,128,0.003470933437347412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,64,0.0031530665854612983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,32,0.0032170665760835014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,16384,0.05867520173390707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,65536,0.19501439730326336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,10240,0.03761386473973592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,12288,0.042803200085957845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,8192,0.031675734122594196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,7168,0.028875732421875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,6144,0.025942399104436235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,5120,0.02225386699040731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,4096,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,3584,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,3072,0.015631999572118124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,2560,0.013194666306177775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,2048,0.011922132968902589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,1024,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,1536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,768,0.006246399879455566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,512,0.005222400029500326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,256,0.003589333345492681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,128,0.0032085334261258446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,64,0.0031914666295051576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,10240,32,0.00325546662012736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,65536,0.1577621301015218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,16384,0.04843519926071167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,12288,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,10240,0.029764266808827718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,8192,0.024168533086776734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,7168,0.02211946646372477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,6144,0.01898026665051778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,5120,0.016643200318018594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,4096,0.013983999689420065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,3072,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,2048,0.008962133526802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,2560,0.010191999872525533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,1536,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,1024,0.005378133555253347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,768,0.004676266511281332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,512,0.004349866509437561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,256,0.0035829332967599234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,128,0.0036117332677046456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,64,0.003180799881617228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,8192,32,0.00323840007185936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,65536,0.1383413314819336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,16384,0.04157439867655437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,12288,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,10240,0.02826133370399475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,8192,0.023962666591008507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,7168,0.02136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,6144,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,5120,0.015620266397794088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,4096,0.012538666526476542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,3072,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,3584,0.012035199999809265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,2560,0.009080533186594646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,2048,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,1536,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,1024,0.004972800115744273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,768,0.004436266422271728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,512,0.004037333279848098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,256,0.0036309334139029183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,64,0.0031946666538715364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,128,0.003533866753180822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,7168,32,0.0032127998769283296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,16384,0.03781973520914714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,65536,0.11994453271230061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,12288,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,8192,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,7168,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,6144,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,5120,0.015618133544921874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,4096,0.011524266997973124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,3072,0.00951039989789327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,3584,0.010601600011189777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,2560,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,2048,0.007223466535409291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,1536,0.005927466849486033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,1024,0.004709333181381226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,768,0.004159999887148539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,512,0.003987200061480204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,256,0.0035157332817713416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,64,0.0031615999837716425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,128,0.0031776001056035364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,6144,32,0.0032287999987602235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,16384,0.03345066706339518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,65536,0.10141013463338215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,12288,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,10240,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,8192,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,7168,0.017464532454808553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,6144,0.016375466187795003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,2,768,12288,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,5120,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,4096,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,3584,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,2560,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,3072,0.008931199709574383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,2048,0.006602666775385539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,768,0.004232533276081085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,1536,0.005449600021044413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,1024,0.004824533561865489
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,512,0.003918933371702829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,256,0.0035690667728583017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,128,0.003221333275238673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,64,0.0032266666491826378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,5120,32,0.0031744000812371576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,16384,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,12288,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,65536,0.08383146921793619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,10240,0.019113600254058838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,8192,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,7168,0.0150709331035614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,6144,0.013565867145856222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,5120,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,3584,0.012880000472068786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,4096,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,3072,0.01181013286113739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,2560,0.010012800494829815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,1536,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,2048,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,1024,0.005870933334032694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,768,0.005051733553409576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,512,0.0044821331898371375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,256,0.0036330667634805044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,128,0.0031957333286603295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,32,0.0033013333876927694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,4096,64,0.0031360000371932983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,16384,0.02430293361345927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,65536,0.07481919924418132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,12288,0.019170133272806804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,10240,0.016910932461420693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,8192,0.014803199966748556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,7168,0.014218667149543762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,6144,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,5120,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,3584,0.01243839959303538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,4096,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,3072,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,2560,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,2048,0.008281599978605907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,1536,0.006569600105285645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,1024,0.00551146666208903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,512,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,768,0.0046410664916038515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,256,0.003566933423280716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,128,0.003252266595760981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,32,0.003235200047492981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3584,64,0.00329066663980484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,16384,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,65536,0.06584320068359376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,12288,0.0173962672551473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,10240,0.015748266379038492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,8192,0.01404906709988912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,7168,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,6144,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,5120,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,3584,0.01049066682656606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,4096,0.00942080020904541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,3072,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,2560,0.008483200271924337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,2048,0.007461333274841308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,1536,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,1024,0.005747200051943461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,512,0.004220800101757049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,768,0.005208533505598704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,256,0.003986133386691412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,128,0.0032543999453385672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,32,0.0032373333970705668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,3072,64,0.003171200056870779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,16384,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,65536,0.057275732358296715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,12288,0.015960533420244852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,10240,0.01441493332386017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,8192,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,7168,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,6144,0.010900266965230306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,5120,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,3584,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,4096,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,3072,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,2560,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,2048,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,1536,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,1024,0.005508266886075338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,768,0.004923733572165171
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,512,0.004300799965858459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,256,0.003962666789690653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,32,0.0032277333239714304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,64,0.0031925333042939507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2560,128,0.0032416000962257386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,16384,0.015827199816703795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,65536,0.047991466522216794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,12288,0.013605333367983499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,10240,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,8192,0.011412266890207927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,7168,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,5120,0.00844586690266927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,6144,0.009215999643007915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,4096,0.007976533472537994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,3584,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,3072,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,2048,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,1536,0.0066431999206542965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,2560,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,1024,0.00544106662273407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,768,0.00487253318230311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,512,0.0043594668308893835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,256,0.003705599904060364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,128,0.0035775999228159585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,64,0.0032586666444937387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,2048,32,0.0032330666979153953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,65536,0.03809279998143514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,12288,0.011890133221944172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,16384,0.014083199699719749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,10240,0.01527679959932963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,8192,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,7168,0.012355200449625651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,5120,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,6144,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,3584,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,4096,0.007876266539096833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,3072,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,2560,0.006670933465162914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,1536,0.005791999896367391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,2048,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,1024,0.005016533533732096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,768,0.004469333092371622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,512,0.004101333270470301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,256,0.003589333345492681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,128,0.0035391998787721
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,32,0.003235200047492981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1536,64,0.0032597333192825317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,65536,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,16384,0.01486186683177948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,12288,0.012547199924786886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,10240,0.011538133025169373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,8192,0.0105621337890625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,7168,0.009546666344006857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,6144,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,5120,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,3072,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,3584,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,4096,0.007089066505432129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,2560,0.005884799857934316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,2048,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,1536,0.0065760001540184024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,1024,0.0054058666030565895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,768,0.004744533201058706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,512,0.004378666480382284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,256,0.0035584000249703727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,128,0.0035818666219711304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,32,0.003236266722281774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,1024,64,0.0032320000231266023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,65536,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,16384,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,12288,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,10240,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,8192,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,6144,0.007392000158627827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,7168,0.0092031995455424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,5120,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,4096,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,3072,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,3584,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,2560,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,2048,0.005366399884223938
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,1536,0.0057888001203536986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,768,0.004457599918047587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,1024,0.0045952002207438145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,256,0.00348693331082662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,512,0.003947733342647553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,128,0.0035103999078273775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,64,0.00322026660044988
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,65536,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,768,32,0.003286399940649668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,12288,16384,0.06775466601053873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,16384,0.011243733763694762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,12288,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,8192,0.008273066580295562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,10240,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,7168,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,6144,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,5120,0.007111466427644093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,3584,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,4096,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,3072,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,2560,0.006669866542021434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,2048,0.0062943999965985615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,1536,0.0051466668645540874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,1024,0.0043029333154360454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,768,0.004041599979003271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,512,0.003912533322970072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,128,0.003221333275238673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,256,0.00348693331082662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,64,0.003209600100914637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,512,32,0.003173333406448364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,65536,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,10240,0.007456000149250031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,12288,0.008376533786455791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,16384,0.008727467060089112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,7168,0.006636799871921539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,8192,0.0070165331164995836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,6144,0.0067007998625437425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,5120,0.006485333542029063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,4096,0.006295466423034668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,3072,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,3584,0.00619946668545405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,2560,0.006167466441790262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,2048,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,1536,0.004762666424115499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,1024,0.00436160018046697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,512,0.0036320000886917113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,256,0.0035989334185918174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,128,0.0031701333820819853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,768,0.003988266736268997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,64,0.0030805334448814393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,256,32,0.0031061333914597826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,65536,0.014016000429789224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,16384,0.00790826678276062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,12288,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,10240,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,8192,0.0065760001540184024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,6144,0.006260266900062561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,7168,0.006822399795055389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,5120,0.006007466713587443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,4096,0.0057888001203536986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,3584,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,2560,0.00631466656923294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,3072,0.005905066430568695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,2048,0.005905066430568695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,1536,0.004806399842103322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,1024,0.004496000210444133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,512,0.003504000107447306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,256,0.003368533402681351
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,128,0.003304533412059148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,64,0.0032106667757034303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,32,0.00308693324526151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,65536,0.01069546639919281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,16384,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,12288,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,10240,0.006190933287143707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,8192,0.006200533111890157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,7168,0.006227200229962667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,6144,0.006192000210285186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,4096,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,5120,0.005789866546789805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,3584,0.006223999957243601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,3072,0.005817600091298421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,2560,0.005859200159708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,2048,0.005849599838256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,1536,0.004675200084845225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,1024,0.004062933226426443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,768,0.004154666761557261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,512,0.0036042665441830954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,256,0.003272533416748047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,128,0.003270400067170461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,64,0.003115733216206233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,64,32,0.003138133386770884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,65536,0.009125333031018574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,16384,0.006635733445485433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,12288,0.006234666705131531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,10240,0.00622506688038508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,8192,0.0054400001962979635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,7168,0.005824000140031179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,6144,0.00591893345117569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,5120,0.005815466741720835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,4096,0.005381333331267038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,3584,0.006190933287143707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,3072,0.005782400071620941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,2560,0.005825066566467285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,2048,0.005850666761398315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,1536,0.004802133142948151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,1024,0.003953066716591517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,768,0.004041599979003271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,512,0.003601066768169403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,256,0.003219199925661087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,128,0.003271466741959254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,64,0.003127466638882955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,32,32,0.003070933371782303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,10240,3.7410527547200525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,12288,4.604997253417968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,16384,6.316168721516927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,7168,2.3111338297526043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,8192,3.0745290120442705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,6144,2.325880432128906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,4096,1.375880559285482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,5120,1.676360575358073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,3584,1.182138697306315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,3072,1.045196787516276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,2560,0.8372906366984049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,2048,0.6969343821207683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,1024,0.3949909210205078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,1536,0.5569536209106445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,768,0.3479893366495768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,128,0.1884501298268636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,512,0.2790741284688314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,256,0.2295466740926107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,64,0.18920106887817384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,65536,32,0.18865493138631184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,12288,1.2386656443277995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,16384,1.6646155039469401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,10240,0.9872725168863932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,8192,0.8258901596069336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,7168,0.710588773091634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,6144,0.6248789469401042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,4096,0.4126720110575358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,5120,0.4990634600321452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,3072,0.30281492869059246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,3584,0.35645440419514973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,2048,0.21384639739990235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,2560,0.25245013236999514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,1024,0.12270932992299396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,1536,0.16670613288879393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,512,0.09366613229115804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,768,0.108406400680542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,128,0.06867626508076986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,256,0.07796160380045572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,64,0.0686090628306071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,32,0.06988906860351562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,16384,65536,7.037849426269531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,16384,1.3261812845865886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,12288,1.008298683166504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,8192,0.6821887969970704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,10240,0.8376319885253907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,6144,0.508348814646403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,7168,0.5898229598999023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,4096,0.34205118815104163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,5120,0.4266677220662435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,3072,0.25504426956176757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,3584,0.2986655871073405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,2048,0.17517120043436687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,2560,0.21275307337443033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,1024,0.10294506549835206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,1536,0.1373184045155843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,768,0.09168213208516439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,512,0.07570772965749105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,256,0.06970026493072509
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,128,0.061441067854563394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,64,0.06181333462397257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,32,0.06017706791559855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,12288,65536,5.27503662109375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,12288,0.857701301574707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,16384,1.1977045694986979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,8192,0.5902346928914388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,10240,0.7199391682942708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,6144,0.4343136151631673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,7168,0.5020650545756022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,4096,0.28958721160888673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,5120,0.3594581286112467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,3072,0.2140501340230306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,3584,0.255454937616984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,float16,1,128,768,0.003969066590070724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,2560,0.18179413477579753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,2048,0.15155199368794758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,1536,0.11826879978179931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,768,0.08065600395202636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,1024,0.0899061361948649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,512,0.06734506289164224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,128,0.05147306521733602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,256,0.0575488011042277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,64,0.050892798105875645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,32,0.04925440152486165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,10240,65536,4.6467432657877605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,12288,0.7452330907185872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,16384,0.9998336156209311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,10240,0.6366207758585612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,8192,0.49332907994588215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,6144,0.38645760218302405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,7168,0.44660053253173826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,5120,0.3147775967915853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,4096,0.2532693386077881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,3584,0.21951467196146646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,3072,0.18940587043762208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,2560,0.16226986249287922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,2048,0.13103679815928143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,1536,0.10386772950490315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,512,0.05939199924468994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,1024,0.08120319843292237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,768,0.07167999744415283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,256,0.051643733183542886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,128,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,64,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,32,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,12288,0.6851231892903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,16384,0.9165130615234375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,8192,65536,4.047124226888021
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,10240,0.5786965052286784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,8192,0.4671146710713704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,7168,0.41151145299275715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,6144,0.3479189236958822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,4096,0.23248213132222495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,5120,0.28958826065063475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,3584,0.19964586893717448
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,3072,0.17408000628153483
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,2560,0.14656960169474284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,2048,0.11977386474609375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,1536,0.09653013547261556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,1024,0.07396693229675293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,768,0.06655786832173666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,512,0.05546666781107584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,128,0.04205013513565063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,256,0.048230401674906415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,32,0.039185067017873124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,64,0.03932160139083862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,12288,0.6609578450520833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,7168,65536,3.6785494486490884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,16384,0.8463701248168946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,10240,0.539034652709961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,8192,0.4390890757242839
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,7168,0.37382825215657556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,4096,0.21179733276367188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,5120,0.2704042752583822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,6144,0.33071788152058923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,3584,0.18486612637837727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,3072,0.16233919461568197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,2560,0.13735253016153973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,1024,0.06799360116322836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,2048,0.11106986999511718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,1536,0.09069226582845052
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,256,0.05236053466796875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,512,0.058369068304697666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,768,0.06191786527633667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,64,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,128,0.039527467886606854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,32,0.03645546833674113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,12288,0.6019754409790039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,16384,0.7970816294352214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,6144,65536,3.438934326171875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,10240,0.493943468729655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,8192,0.3942399978637695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,7168,0.3426645278930664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,6144,0.2994858741760254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,5120,0.2448042710622152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,4096,0.19158933957417806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,3584,0.16936960220336914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,3072,0.14608960151672362
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,2560,0.12226666609446209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,1536,0.08294293085734049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,1024,0.062021334966023765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,2048,0.10226240158081054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,256,0.04109546740849813
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,768,0.05785599946975708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,512,0.0474122683207194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,64,0.04082346757253011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,128,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,32,0.03891199827194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,12288,0.5368490854899088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,16384,0.7155029296875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,5120,65536,3.064763641357422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,7168,0.30385494232177734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,10240,0.43595199584960936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,8192,0.3519477208455404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,4096,0.17271253267923992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,5120,0.2174623966217041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,6144,0.2613248030344645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,3584,0.15032320022583007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,2560,0.10939733187357585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,3072,0.12864853541056315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,1536,0.0729087988535563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,2048,0.0920576016108195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,1024,0.05717333157857259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,768,0.0504149317741394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,512,0.04314560095469157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,256,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,128,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,64,0.03304106593132019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,32,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,12288,0.4811093330383301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,16384,0.6512981414794922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,4096,65536,2.743499755859375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,7168,0.2865824063618978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,10240,0.40987199147542314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,8192,0.3309226671854655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,4096,0.1600170612335205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,6144,0.24780799547831217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,5120,0.20257919629414878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,3584,0.14008426666259766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,3072,0.12349332968393963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,2560,0.10298026402791341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,2048,0.08700586954752604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,1536,0.07116693655649821
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,1024,0.05376000006993612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,512,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,768,0.04928853511810303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,256,0.03351786533991496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,128,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,64,0.028807467222213744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,32,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,12288,0.47230186462402346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3584,65536,2.481424967447917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,16384,0.6191445032755534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,7168,0.27688961029052733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,10240,0.3874805450439453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,8192,0.30952107111612953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,4096,0.15202986399332682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,5120,0.19548160235087078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,6144,0.2370218594868978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,3584,0.133188263575236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,2560,0.0991914669672648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,3072,0.11482453346252441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,2048,0.08127040068308512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,1536,0.06601279973983765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,1024,0.05092693169911703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,512,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,768,0.04696640173594157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,256,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,64,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,128,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,32,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,12288,0.43807465235392257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,16384,0.5808117548624675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,3072,65536,2.4052383422851564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,7168,0.265011199315389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,10240,0.3704490661621094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,8192,0.30132907231648765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,4096,0.1496405283610026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,5120,0.18715306917826335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,6144,0.2274986743927002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,3584,0.13110613028208415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,2560,0.09669866561889648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,3072,0.1107968012491862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,1536,0.06526293357213339
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,2048,0.07973439693450927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,1024,0.04894719918568929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,768,0.043689600626627606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,512,0.035225598017374675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,256,0.030855466922124226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,128,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,64,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,32,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,12288,0.4098047892252604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,16384,0.5440842946370442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2560,65536,2.2217386881510417
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,7168,0.23804693222045897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,10240,0.34614718755086266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,8192,0.2749781290690104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,4096,0.13431466420491536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,6144,0.20496959686279298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,5120,0.16984747250874838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,3584,0.11874879995981853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,3072,0.10007999738057453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,2560,0.08625493049621583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,1536,0.057240533828735354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,1024,0.04362346728642781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,2048,0.07113280296325683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,256,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,768,0.039867734909057616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,512,0.03324693242708842
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,64,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,128,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,32,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,12288,0.3796991984049479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,16384,0.5022037188212077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,2048,65536,2.0788543701171873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,7168,0.22572372754414877
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,10240,0.3174378712972005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,8192,0.25620479583740235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,4096,0.12581546306610109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,5120,0.1576266606648763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,6144,0.19486719767252605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,3584,0.10939733187357585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,2560,0.07994133631388346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,3072,0.09420693715413411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,1536,0.05502293507258097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,2048,0.06543360153834024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,1024,0.04430400133132935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,768,0.03959360122680664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,512,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,256,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,128,0.027170133590698243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,64,0.02327573299407959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,32,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,12288,0.3437568028767904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1536,65536,1.927578608194987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,16384,0.4543146769205729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,7168,0.20688319206237793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,10240,0.2890421231587728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,8192,0.2324831962585449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,4096,0.11359679698944092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,5120,0.14376959800720215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,6144,0.17810880343119304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,3584,0.09785919984181722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,2560,0.06990506649017333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,3072,0.08441279729207357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,2048,0.057139201958974206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,1536,0.0469322681427002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,1024,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,512,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,768,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,256,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,64,0.020750933885574342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,128,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,12288,0.32805439631144206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,1024,65536,1.7475925445556642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,16384,0.43233280181884765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,7168,0.1996448040008545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,10240,0.27900587717692055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,8192,0.2270890712738037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,4096,0.11025066375732422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,6144,0.17141653696695963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,5120,0.1406976064046224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,3584,0.09390079975128174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,3072,0.08185173670450846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,2560,0.06666239897410074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,2048,0.05580799976984659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,1536,0.04498773415883382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,1024,0.035224533081054686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,768,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,512,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,256,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,128,0.022871466477711995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,12288,0.31286614735921225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,768,65536,1.6674816131591796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,16384,0.4107626597086589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,7168,0.1885877291361491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,8192,0.2135039965311686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,10240,0.26391894022623696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,4096,0.10195519924163818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,5120,0.133188263575236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,6144,0.16206506093343098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,3072,0.07283946673075357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,2560,0.0636576016743978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,3584,0.08755199909210205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,1536,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,2048,0.05116586685180664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,1024,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,512,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,768,0.03140053351720174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,256,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,128,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,64,0.020205867290496827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,32,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,12288,0.3011242548624674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,16384,0.3961514790852865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,512,65536,1.5927637736002604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,7168,0.1799509366353353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,10240,0.25347414016723635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,8192,0.2047658602396647
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,4096,0.09550613562266032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,6144,0.15332800547281902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,5120,0.12598400115966796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,3584,0.07997439702351888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,3072,0.06925653616587321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,2560,0.055910400549570714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,1536,0.040277334054311116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,1024,0.032560000816981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,2048,0.047172268231709794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,256,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,768,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,512,0.024850134054819742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,64,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,128,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,32,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,12288,0.2959338823954264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,256,65536,1.5264437357584635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,16384,0.38966506322224936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,7168,0.17606080373128255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,10240,0.2484224001566569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,8192,0.20032854080200196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,4096,0.09134079615275065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,6144,0.14970879554748534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,5120,0.1210367997487386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,3584,0.07601493199666341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,3072,0.06813013553619385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,2560,0.05420373280843099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,2048,0.04519253174463908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,1536,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,1024,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,768,0.029425066709518433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,512,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,256,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,32,0.016860800981521606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,12288,0.2954581260681152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,16384,0.38830080032348635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,128,65536,1.5123797098795573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,7168,0.17530879974365235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,10240,0.24746665954589844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,8192,0.19978240331013997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,4096,0.093013334274292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,5120,0.12038826942443848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,6144,0.14970879554748534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,2560,0.05334933201471964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,3584,0.0779263973236084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,3072,0.065774933497111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,1536,0.03891093333562215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,2048,0.045466665426890054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,1024,0.031061333417892457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,512,0.024782933791478477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,768,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,256,0.02198293407758077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,12288,0.2935381253560384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,64,65536,1.5093077341715495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,16384,0.3874133427937826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,7168,0.17435305913289387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,8192,0.19937280019124348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,10240,0.24685227076212563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,4096,0.09045226573944092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,5120,0.12028586864471436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,6144,0.1484117348988851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,3072,0.06070079803466797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,2560,0.053179732958475744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,3584,0.0774826685587565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,1536,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,2048,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,1024,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,512,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,768,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,256,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,128,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,32,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,10240,1.8075669606526692
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,12288,2.1687296549479167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,16384,2.959362030029297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,7168,1.2183551788330078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8192,32,65536,1.502344512939453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,8192,1.391823959350586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,6144,0.9922570546468099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,4096,0.6983008066813151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,3072,0.5082794825236003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,5120,0.8697173436482748
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,3584,0.6031712214152019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,1536,0.2914965311686198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,2048,0.3603455861409505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,2560,0.44475520451863604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,1024,0.21063680648803712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,256,0.12731733322143554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,512,0.15059626897176107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,768,0.18514026006062825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,128,0.10315093199412029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,64,0.10622080167134602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,65536,32,0.10454933643341065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,10240,0.5127498626708984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,12288,0.6194847742716472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,16384,0.8157194773356119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,8192,0.40625492731730145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,7168,0.36007359822591145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,6144,0.3078144073486328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,4096,0.21452800432840982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,5120,0.2567509333292643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,3584,0.18954240481058757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,2560,0.13987733523050944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,3072,0.16411306063334147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,2048,0.1144821325937907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,1024,0.0747530698776245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,1536,0.09448213577270508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,768,0.06686720053354898
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,256,0.04911786715189616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,512,0.05939199924468994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,64,0.04177706638971965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,128,0.04143786827723185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,32,0.0413696010907491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,16384,65536,3.5248502095540366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,12288,0.5097077369689942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,16384,0.6703776041666667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,10240,0.4301482518513997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,8192,0.3387733459472656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,7168,0.290338134765625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,5120,0.2130261262257894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,6144,0.2544309298197428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,4096,0.17107733090718585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,3584,0.1565344015757243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,3072,0.1349290688832601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,2560,0.11581546465555828
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,2048,0.09652907053629557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,1536,0.07990612983703613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,768,0.057479465007781984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,512,0.05621866782506307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,1024,0.0604479988416036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,256,0.04911893208821615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,128,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,64,0.035702399412790936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,32,0.037571199735005695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,12288,65536,2.67236811319987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,12288,0.4634623845418294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,16384,0.6043306350708008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,10240,0.36512533823649085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,8192,0.2960042635599772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,7168,0.2529962698618571
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,6144,0.22108160654703773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,5120,0.18688000043233235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,3584,0.13458666801452637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,4096,0.1496405283610026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,3072,0.11919466654459636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,2560,0.10202453136444092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,2048,0.08417279720306396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,1536,0.07253440221150717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,1024,0.0549888014793396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,768,0.051337599754333496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,256,0.04686506589253743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,512,0.04707093238830566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,128,0.03406399885813395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,64,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,32,0.034542934099833174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,10240,65536,2.4410463968912763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,12288,0.401032543182373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,16384,0.5234688123067219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,10240,0.3194197336832682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,8192,0.2515626589457194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,7168,0.2154143969217936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,6144,0.1897119998931885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,5120,0.1596768061319987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,4096,0.12907520135243733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,3584,0.11980693340301514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,3072,0.10359466870625814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,2560,0.0897706667582194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,2048,0.07454720338185629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,1536,0.06406826575597127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,1024,0.048536535104115805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,768,0.046216531594594316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,512,0.04157439867655437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,256,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,128,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,32,0.035292800267537436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,64,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,8192,65536,2.0334239959716798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,12288,0.35382719039916993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,16384,0.4633941332499186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,10240,0.2894495964050293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,8192,0.2295466740926107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,7168,0.19677866299947103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,5120,0.1477290630340576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,4096,0.11854506333669027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,6144,0.1699168046315511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,3584,0.11069440046946208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,3072,0.09328640302022298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,2560,0.08396906852722168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,1536,0.05792533159255982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,2048,0.06987093289693197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,1024,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,512,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,768,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,256,0.03222293257713318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,64,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,32,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,65536,1.8273621877034505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,16384,0.4506986618041992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,12288,0.34396158854166664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,8192,0.21780479749043785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,10240,0.27108586629231773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,7168,0.18961067199707032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,6144,0.16233812967936198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,5120,0.1374538739522298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,4096,0.11042133172353108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,3584,0.10241920153299969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,3072,0.08727893034617105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,2560,0.07966720263163249
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,65536,1.6928085327148437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,2048,0.0636245330174764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,1024,0.04334933360417684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,1536,0.05553386608759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,768,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,512,0.03686293363571167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,256,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,128,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,64,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,6144,32,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,12288,0.3025578816731771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,16384,0.3947861353556315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,10240,0.25641066233317056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,8192,0.19834879239400227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,6144,0.1484810670216878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,7168,0.17537493705749513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,4096,0.10455040136973064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,5120,0.12622506618499757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,3072,0.08178239663441976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,3584,0.09574399789174398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,2048,0.06031359831492106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,2560,0.07253333727518717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,1024,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,1536,0.05218986670176188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,65536,1.526476796468099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,768,0.0389792005221049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,512,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,128,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,256,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,64,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,5120,32,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,12288,0.2727253278096517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,16384,0.36540053685506185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,8192,0.17565013567606608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,10240,0.2195807933807373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,6144,0.1300821304321289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,7168,0.1527125358581543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,5120,0.11021653016408284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,3584,0.08400320212046306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,3072,0.07195306619008382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,65536,1.3635594685872396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,2560,0.06358933448791504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,1536,0.047378134727478025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,2048,0.053384534517923986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,1024,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,768,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,512,0.03174399932225545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,256,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,128,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,32,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,64,0.025191466013590496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,16384,0.3512661298116048
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,12288,0.26344106992085775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,10240,0.20148800214131674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,8192,0.15885547002156575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,65536,1.3226324717203775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,7168,0.13878506024678547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,6144,0.1189194679260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,5120,0.10209279855092365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,4096,0.08369386990865071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,3072,0.0669696013132731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,3584,0.07622186342875162
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,2560,0.059731201330820716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,2048,0.04976640144983928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,1536,0.04416853189468384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,1024,0.03481493393580119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,768,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,512,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,256,0.02648640076319377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,128,0.02443839907646179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,64,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3584,32,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,16384,0.32064854303995766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,12288,0.24186879793802896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,10240,0.19302399953206378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,8192,0.1527125358581543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,65536,1.2115946451822917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,6144,0.11468799908955891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,7168,0.13370025952657064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,5120,0.09687146345774332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,4096,0.08034986654917399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,3584,0.07273706595102945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,3072,0.06386346817016601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,2560,0.057275732358296715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,2048,0.048640000820159915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,1536,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,1024,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,768,0.03427199920018514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,512,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,256,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,128,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,64,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,3072,32,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,16384,0.30317118962605794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,7168,128,0.028809599081675213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,12288,0.22865920066833495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,10240,0.183570130666097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,8192,0.14172053337097168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,7168,0.12588480313618977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,6144,0.10670080184936523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,5120,0.09137492974599203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,65536,1.141555150349935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,3584,0.06795946756998697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,4096,0.07437653541564941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,3072,0.05884586572647095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,2560,0.054611198107401525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,2048,0.045943466822306316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,1536,0.039662933349609374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,1024,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,512,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,768,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,256,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,128,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2560,32,0.02130026618639628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,12288,0.20851945877075195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,16384,0.27347625096639
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,10240,0.17332906723022462
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,8192,0.13369919459025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,7168,0.12083306312561035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,6144,0.09983893235524496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,5120,0.0865610678990682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,4096,0.06932480335235595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,3584,0.06550186475118001
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,3072,0.05638826688130697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,2560,0.053384534517923986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,2048,0.04491839806238811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,65536,1.0292896270751952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,1536,0.039937067031860354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,1024,0.031674667199452715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,768,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,512,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,64,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,128,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,256,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,2048,32,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,12288,0.1936384042104085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,16384,0.2543605327606201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,10240,0.160698668162028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,8192,0.12532052993774415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,7168,0.10861226717631023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,6144,0.09475306669871011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,5120,0.079257599512736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,4096,0.06393173138300577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,3584,0.05915306806564331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,3072,0.051369599501291906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,2560,0.04724053144454956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,2048,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,65536,0.9577130635579427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,1536,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,768,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,1024,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,512,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,4096,4096,0.09226133028666178
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,256,0.022663466135660806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,128,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,64,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1536,32,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,10240,0.14506667455037434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,12288,0.17646826108296712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,16384,0.23292479515075684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,7168,0.1008639971415202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,8192,0.11444906393686931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,6144,0.08144426345825195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,4096,0.05826453367869059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,5120,0.07127040227254232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,3584,0.05358933210372925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,2560,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,3072,0.04771840174992879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,2048,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,1536,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,1024,0.027646932999293012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,512,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,768,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,256,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,128,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,1024,65536,0.884667714436849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,12288,0.16889173189798992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,16384,0.22422186533610025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,10240,0.13813865979512532
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,8192,0.10673387050628662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,7168,0.0920576016108195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,6144,0.07768747011820475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,4096,0.05369173288345337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,5120,0.06546773513158163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,3584,0.04980053504308064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,3072,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,2048,0.03638613224029541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,2560,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,1024,0.027514666318893433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,1536,0.03283519943555196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,768,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,512,0.024577067295710246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,256,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,64,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,768,65536,0.8640511830647787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,12288,0.16247572898864746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,16384,0.2147669315338135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,10240,0.1335968017578125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,8192,0.10284266471862794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,7168,0.08724693457285562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,6144,0.07369386355082194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,5120,0.06321599880854288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,4096,0.05003840128580729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,3584,0.04922026793162028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,2048,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,3072,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,1024,0.026149332523345947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,1536,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,512,0.023959465821584067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,768,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,256,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,128,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,65536,0.8191296259562174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,16384,0.20879359245300294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,12288,0.15605653127034505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,10240,0.1265664021174113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,8192,0.09588053226470947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,7168,0.08226453463236491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,6144,0.06840213139851889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,5120,0.05765120188395182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,4096,0.047172268231709794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,3584,0.045125333468119304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,3072,0.039867734909057616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,2560,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,65536,0.7764991760253906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,2048,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,1024,0.02539413372675578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,1536,0.030037333567937214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,512,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,256,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,64,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,12288,0.1521663983662923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,16384,0.20579093297322593
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,10240,0.12393706639607746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,8192,0.09468479951222739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,6144,0.0684384028116862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,7168,0.07860906918843588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,4096,0.04703573385874431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,5120,0.05584213336308798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,3072,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,3584,0.043483734130859375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,2048,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,2560,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,65536,0.769809087117513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,1024,0.024779733022054037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,1536,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,512,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,256,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,64,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,128,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,12288,0.15196372667948405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,16384,0.20333226521809897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,8192,0.0942080020904541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,10240,0.12216213544209797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,7168,0.0796341339747111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,6144,0.06581120093663534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,5120,0.05748053391774496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,4096,0.045602134863535565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,3584,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,3072,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,2560,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,2048,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,65536,0.7634613037109375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,1536,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,1024,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,512,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,256,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,64,32,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,12288,0.15155307451883954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,16384,0.2023082733154297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,10240,0.1252010663350423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,8192,0.09530133406321208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,7168,0.08028053442637126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,6144,0.06986986796061198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,4096,0.04713813463846843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,5120,0.05573973258336386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,3584,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,3072,0.039049601554870604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,2048,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,2560,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,65536,0.7610709508260091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,1536,0.030037333567937214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,1024,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,512,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,768,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,32,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,12288,1.0505877176920573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,16384,1.4357855478922525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,10240,0.8368810653686524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,8192,0.667033576965332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,7168,0.587229855855306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,6144,0.5071221351623535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,5120,0.4423701286315918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,4096,0.35304107666015627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,3584,0.31778132120768227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,3072,0.2723157246907552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,2560,0.23077546755472816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,2048,0.18906453450520833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,1536,0.1509365399678548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,1024,0.11431146462758382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,768,0.10069333712259929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,512,0.08454720179239908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,256,0.07287360032399495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,128,0.06502506732940674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,64,0.06560426553090414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,65536,32,0.06389760176340739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,16384,0.4404575983683269
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,12288,0.3281909306844076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,10240,0.2594837347666422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,65536,1.7366687774658203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,8192,0.2095775922139486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,7168,0.18967893918355305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,6144,0.15974399248758953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,5120,0.14008320172627767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,3584,0.10646186669667561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,4096,0.11202666759490967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,3072,0.09281173547108969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,2560,0.07837119897206625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,2048,0.06754986445109049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,1536,0.05775359869003296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,1024,0.04775360027949015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,768,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,512,0.03911786476771037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,128,0.03604480028152466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,256,0.03078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,64,0.0348853349685669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,16384,32,0.033587201436360674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,16384,0.3521514574686686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,512,2560,0.03904746770858765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,12288,0.26699094772338866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,10240,0.21377600034077965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,8192,0.17517120043436687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,65536,1.3602804819742838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,7168,0.15530667304992676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,6144,0.1342463970184326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,4096,0.09253439903259278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,5120,0.11909120082855225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,3584,0.08741652965545654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,3072,0.07731093565622965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,2560,0.06812907059987386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,2048,0.057411201794942225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,1536,0.05007359981536865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,1024,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,768,0.03822933435440064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,512,0.03338239987691243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,256,0.030446932713190718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,64,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,128,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,12288,32,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,12288,0.2275008042653402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,16384,0.2949119885762533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,10240,0.19507306416829426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,8192,0.15694506963094074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,7168,0.14308692614237467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,6144,0.12141226927439372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,5120,0.10915946960449219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,4096,0.08755199909210205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,65536,1.14858767191569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,3584,0.0846506675084432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,3072,0.07293972969055176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,2560,0.0636245330174764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,2048,0.05536426703135172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,1024,0.03932053248087565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,768,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,1536,0.04799253145853678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,256,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,512,0.032356266180674234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,128,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,32,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,10240,64,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,12288,0.20367040634155273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,16384,0.26180267333984375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,10240,0.1697109381357829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,8192,0.135372797648112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,6144,0.10591466426849365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,7168,0.12588266531626385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,4096,0.07655893166859945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,5120,0.09321706295013428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,65536,1.0481322606404624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,3072,0.0612010677655538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,3584,0.0703488032023112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,2048,0.04713919957478841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,1536,0.04437333345413208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,2560,0.05358933210372925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,1024,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,768,0.03426880041758219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,512,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,256,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,128,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,64,0.024784000714619954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,8192,32,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,12288,0.17134826978047688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,16384,0.22961600621541342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,10240,0.14274560610453288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,8192,0.11847679615020752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,7168,0.10690773328145345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,6144,0.09236480394999186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,5120,0.08161386648813883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,65536,0.9171967824300131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,4096,0.06724159717559815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,3584,0.06314666668574015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,3072,0.058606934547424314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,2560,0.04993706544240316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,2048,0.04444160064061482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,1536,0.0392522652943929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,1024,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,768,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,512,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,128,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,256,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,64,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,7168,32,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,12288,0.16616106033325195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,16384,0.22408533096313477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,8192,0.11403840382893879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,10240,0.13953065872192383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,6144,0.0877568006515503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,7168,0.1044810692469279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,4096,0.06587839921315511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,5120,0.0779263973236084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,65536,0.8544928232828776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,3072,0.053965866565704346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,3584,0.06184959808985392
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,2048,0.0423253337542216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,1536,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,2560,0.04860586722691854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,1024,0.03290346662203471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,768,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,512,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,256,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,128,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,64,0.023895466327667238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,6144,32,0.024235733350118003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,12288,0.15339520772298176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,16384,0.20497066179911294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,10240,0.12134400208791096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,8192,0.10100053151448567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,7168,0.09236480394999186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,6144,0.07987306912740072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,5120,0.07048640251159669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,65536,0.8306005477905274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,4096,0.05785599946975708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,3584,0.05546453396479288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,3072,0.05130240122477213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,2560,0.04491946697235107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,2048,0.040004265308380124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,1536,0.0357045332590739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,768,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,1024,0.03065173427263896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,512,0.02573546568552653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,256,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,64,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,5120,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4096,32,256,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,12288,0.13134506543477376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,16384,0.17749333381652832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,10240,0.1134602705637614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,8192,0.09232959747314454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,7168,0.08707306385040284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,6144,0.07273813088734946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,5120,0.06502399841944376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,4096,0.05591146548589071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,3072,0.04676266511281331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,3584,0.05218986670176188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,2560,0.04369066556294759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,1024,0.02956266601880391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,2048,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,1536,0.03351999918619792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,65536,0.6827349344889323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,512,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,768,0.026898133754730224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,256,0.022731733322143555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,128,0.022051199277242025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,64,0.021569067239761354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,4096,32,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,10240,0.11499520142873128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,12288,0.12806933720906574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,16384,0.17046079635620118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,8192,0.09468586444854736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,7168,0.08424106438954672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,6144,0.07266666889190673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,4096,0.054271999994913736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,5120,0.06580906709035238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,3584,0.051643733183542886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,3072,0.04634026686350505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,2560,0.043383467197418216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,1536,0.034542934099833174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,1024,0.029765333731969195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,2048,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,65536,0.6807551701863607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,768,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,512,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,128,0.019113600254058838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,256,0.022392533222834268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,64,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3584,32,0.020207999149958293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,10240,0.09891733328501383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,12288,0.11612053712209065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,16384,0.15366826057434083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,7168,0.07355733712514242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,8192,0.0816810687383016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,6144,0.06348906755447388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,4096,0.04962986707687378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,5120,0.057378133138020836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,3584,0.047172268231709794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,2560,0.037887998421986896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,3072,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,2048,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,1536,0.03113066752751668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,1024,0.0284661332766215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,65536,0.6142293294270833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,768,0.024984532594680788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,512,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,256,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,3072,64,0.020413867632548013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,12288,0.10881600379943848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,10240,0.09082880020141601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,16384,0.1469770590464274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,8192,0.07427413463592529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,6144,0.05915306806564331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,7168,0.067686398824056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,5120,0.053350400924682614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,4096,0.045398398240407305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,3584,0.04314560095469157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,3072,0.040277334054311116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,2560,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,2048,0.032562132676442465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,65536,0.583407974243164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,1536,0.03078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,1024,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,256,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,512,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,128,0.019523199399312338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,32,0.018498132626215615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2560,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,16384,0.13482774098714193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,12288,0.09994133313496908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,10240,0.08492480119069418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,7168,0.06413653294245401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,8192,0.06963199774424235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,6144,0.05543359915415445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,5120,0.0500053326288859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,4096,0.043621333440144856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,3584,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,3072,0.03891199827194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,2560,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,2048,0.030854399998982745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,1536,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,65536,0.5379402796427409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,1024,0.026012800137201947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,768,0.02409706711769104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,512,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,256,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,128,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,2048,32,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,10240,0.07837013403574625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,16384,0.12486186822255452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,12288,0.09321813583374024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,8192,0.0634879986445109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,7168,0.06086080074310303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,6144,0.05195200045903524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,5120,0.047172268231709794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,4096,0.04102933406829834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,3584,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,3072,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,2560,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,2048,0.02969599962234497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,1536,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,1024,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,65536,0.5153450647989909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,768,0.023894399404525757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,512,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,256,0.018703999121983846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,32,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1536,64,0.018024533987045288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,16384,0.11594879627227783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,12288,0.08390080134073893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,10240,0.06987093289693197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,7168,0.053931732972462974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,8192,0.05901653369267782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,6144,0.04720640182495117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,5120,0.04498773415883382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,4096,0.03850133419036865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,3584,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,2560,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,3072,0.03351999918619792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,2048,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,1024,0.024301866690317787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,1536,0.027853866418202717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,65536,0.4721664110819499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,768,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,512,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,256,0.01877440015474955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,128,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,32,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,1024,64,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,12288,0.0815445343653361
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,16384,0.11154773235321044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,10240,0.06894933382670085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,8192,0.05536426703135172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,7168,0.053282133738199865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,6144,0.0472053329149882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,4096,0.03768320083618164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,5120,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,3584,0.03645546833674113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,2560,0.030956800778706866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,3072,0.03303999900817871
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,2048,0.02826346755027771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,1536,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,65536,0.43970559438069656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,1024,0.023142399390538533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,768,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,256,0.019318399826685588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,512,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,128,0.017885865767796834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,64,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,768,32,0.01699626644452413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,10240,0.06413546800613404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,16384,0.10792960325876873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,12288,0.07621973355611165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,8192,0.054647465546925865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,7168,0.04918613433837891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,6144,0.043075199921925864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,4096,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,5120,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,3584,0.03406613270441691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,2560,0.030584534009297688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,3072,0.031269333759943646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,2048,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,65536,0.42618878682454425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,1536,0.02648640076319377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,768,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,16384,0.10321919918060303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,12288,0.0723626693089803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,10240,0.059563732147216795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,7168,0.04652373393376668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,8192,0.05130240122477213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,6144,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,5120,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,4096,0.03290346662203471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,3584,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,3072,0.03078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,2560,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,2048,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,65536,0.4033194541931152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,1536,0.02471359968185425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,1024,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,768,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,256,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,512,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,128,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,16384,0.10024853547414143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,12288,0.06833493709564209
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,10240,0.05717333157857259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,7168,0.04614826838175456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,8192,0.049356798330942794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,6144,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,5120,0.038571735223134354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,4096,0.03324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,3584,0.03269973397254944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,3072,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,2560,0.027373866240183516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,2048,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,65536,0.398472531636556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,1536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,768,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,128,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,10240,0.05789120197296142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,16384,0.09755307038625081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,12288,0.06830080350240073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,8192,0.05034666856129964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,7168,0.04533119996388753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,6144,0.039800532658894855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,4096,0.03290560046831767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,5120,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,3584,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,2560,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,3072,0.029285333553949994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,2048,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,65536,0.3934218724568685
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,1536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,1024,0.02258346676826477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,768,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,256,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,128,0.01692906618118286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,16384,0.1013760010401408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,12288,0.06751573085784912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,10240,0.05806080102920532
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,7168,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,8192,0.05123413403828939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,6144,0.04041386842727661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,5120,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,4096,0.03285119930903117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,3584,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,3072,0.030478932460149127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,2560,0.027239465713500978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,2048,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,65536,0.3919189453125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,1536,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,768,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,32,0.016759467124938966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2048,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,12288,0.5451775868733724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,10240,0.44530665079752607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,8192,0.3634869257609049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,16384,0.7043039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,7168,0.32785065968831384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,4096,0.19083840052286785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,6144,0.2719061215718587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,5120,0.23353919982910157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,2560,0.12574613094329834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,3072,0.1497770627339681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,3584,0.17223679224650065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,2048,0.10639359951019287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,1536,0.08622079690297445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,1024,0.06963199774424235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,768,0.05997333526611328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,512,0.05311146577199301
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,256,0.04942506551742554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,128,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,64,0.04177920023600261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,65536,32,0.04198293288548787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,12288,0.17558186848958332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,16384,0.2276085376739502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,10240,0.1491626739501953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,8192,0.12325653235117595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,7168,0.11441706816355388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,6144,0.09811840057373047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,4096,0.06741440296173096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,5120,0.08502613703409831
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,3584,0.06686506271362305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,65536,0.8396117528279623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,3072,0.059528533617655435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,2560,0.051369599501291906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,2048,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,1536,0.04082346757253011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,1024,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,768,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,256,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,128,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,512,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,64,0.025124265750249224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,16384,32,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,12288,0.13561174074808757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,10240,0.11980799833933513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,16384,0.18459307352701823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,8192,0.09618879954020182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,7168,0.08826879660288492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,6144,0.07973439693450927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,4096,0.057241598765055336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,5120,0.06898240248362222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,3584,0.05519359906514486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,65536,0.7165290832519531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,3072,0.05120000044504801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,2560,0.045259733994801835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,2048,0.04061973492304484
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,1536,0.036933334668477376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,1024,0.031675734122594196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,768,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,256,0.026078933477401735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,128,0.02402879993120829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,512,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,64,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,12288,32,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,12288,0.12892159620920818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,10240,0.10953386624654134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,16384,0.16377065976460775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,8192,0.08785920143127442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,7168,0.08530133565266927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,6144,0.07349013487497966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,5120,0.06365866661071777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,4096,0.05464640061060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,65536,0.621669324239095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,2560,0.04430506626764934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,3072,0.04724053144454956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,2048,0.038228265444437665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,1536,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,1024,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,768,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,512,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,256,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,128,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,64,0.022258132696151733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,32,0.021027199427286782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,12288,0.10803199609120687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,16384,0.13837547302246095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,8192,0.07990612983703613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,10240,0.09468479951222739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,65536,0.5109077453613281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,7168,0.07533120314280192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,6144,0.06464853286743164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,5120,0.0553984006245931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,4096,0.049459199110666915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,3584,0.04669440189997355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,3072,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,2560,0.041493332386016844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,2048,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,1536,0.03140160044034322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,1024,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,512,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,256,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,128,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,64,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,8192,32,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,12288,0.09656319618225098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,16384,0.11885333061218262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,8192,0.0740010658899943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,10240,0.08983893394470215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,65536,0.4776277224222819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,7168,0.07045119603474935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,6144,0.06140480041503906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,4096,0.04638933340708415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,5120,0.053452801704406736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,3072,0.04246079921722412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,2560,0.038228265444437665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,2048,0.034815998872121175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,1536,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,1024,0.02655679980913798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,512,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,256,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,128,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,32,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,16384,0.11489280064900716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,12288,0.09165759881337485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,65536,0.45970665613810224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,10240,0.07980373700459799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,7168,0.0617141326268514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,8192,0.06563839912414551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,6144,0.05505706469217936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,5120,0.04904959996541341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,4096,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,3584,0.04109760125478108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,3072,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,2560,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,2048,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,1536,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,1024,0.026146133740743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,768,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,512,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,256,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,64,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,6144,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,16384,0.10639253457387288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,12288,0.08417279720306396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,65536,0.41465174357096357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,10240,0.07181546688079835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,8192,0.059868800640106204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,7168,0.05543359915415445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,6144,0.05027840137481689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,5120,0.04485119978586833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,3584,0.03911573489507039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,4096,0.039661868413289385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,3072,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,2560,0.034543999036153156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,2048,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,1536,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,1024,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,768,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,512,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,256,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,128,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,5120,32,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,16384,0.09294613202412924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,12288,0.07345386346181235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,65536,0.35495360692342126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,10240,0.06509226560592651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,8192,0.05491733153661092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,7168,0.05130240122477213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,5120,0.04150613149007161
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,6144,0.04690026839574178
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,4096,0.037001601854960126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,3584,0.03631893396377563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,3072,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,2560,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,2048,0.028809599081675213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,1536,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,1024,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,768,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,512,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,64,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,4096,32,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,16384,0.0932522694269816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,12288,0.07341972986857095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,65536,0.37451092402140296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,10240,0.06703786849975586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,8192,0.05502293507258097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,7168,0.051438931624094644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,6144,0.04771840174992879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,5120,0.043075199921925864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,3584,0.037001601854960126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,4096,0.037273601690928145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,3072,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,2560,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,2048,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,1536,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,1024,0.024029866854349772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,768,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,512,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,128,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3584,32,0.017889066537221273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,16384,0.08157973289489746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,12288,0.0642410675684611
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,65536,0.3400725364685059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,10240,0.05741226673126221
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,8192,0.04922026793162028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,7168,0.04717333316802978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,5120,0.03925333420435588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,6144,0.043075199921925864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,4096,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,3584,0.03310826619466146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,3072,0.03256426652272542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,2560,0.030037333567937214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,2048,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,1536,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,1024,0.0230730672677358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,768,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,512,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,256,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,64,0.016794667641321818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,3072,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,16384,0.07669760386149088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,12288,0.06082559823989868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,65536,0.32010132471720376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,10240,0.05338346560796102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,8192,0.04710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,7168,0.045534932613372804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,6144,0.04116586844126384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,5120,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,3584,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,4096,0.03317760030428569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,3072,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,2560,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,2048,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,1536,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,768,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,256,0.017682133118311565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,128,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2560,32,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,16384,0.07181653181711832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,12288,0.0556714653968811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,65536,0.29402453104654946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,10240,0.051269332567850746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,8192,0.04341866572697957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,7168,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,5120,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,6144,0.038571735223134354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,4096,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,3584,0.030243200063705445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,3072,0.028807467222213744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,2560,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,2048,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,1536,0.022935465971628825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,768,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,512,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,256,0.017338667313257852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,64,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,2048,32,0.017682133118311565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,10240,3584,0.051369599501291906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,16384,0.06560320059458415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,12288,0.05314559936523437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,10240,0.04918613433837891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,65536,0.2602997303009033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,7168,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,8192,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,5120,0.03331306576728821
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,6144,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,4096,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,3584,0.028809599081675213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,3072,0.02805759906768799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,2560,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,2048,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,1536,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,1024,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,768,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,512,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,128,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,256,0.017884800831476845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,64,0.01693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1536,32,0.017542399962743125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,16384,0.06280533472696939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,12288,0.050653866926829015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,10240,0.04686506589253743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,8192,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,6144,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,7168,0.03795733451843262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,65536,0.24698774019877115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,5120,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,4096,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,3584,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,3072,0.027102933327356978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,2560,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,2048,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,1024,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,768,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,512,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,256,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,64,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,1024,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,16384,0.06045013268788656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,12288,0.04775253136952718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,7168,3584,0.046077867348988846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,7168,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,10240,0.044853333632151285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,8192,0.03843520085016887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,6144,0.0341322660446167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,5120,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,65536,0.22981866200764975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,4096,0.027237333854039508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,2560,0.024781866868336996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,3584,0.028193066517512005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,3072,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,2048,0.023348265886306764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,1024,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,768,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,256,0.0182261327902476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,128,0.01775146722793579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,64,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,768,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,12288,0.047133866945902506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,16384,0.059563732147216795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,10240,0.04170986811319987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,7168,0.03624853293100993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,8192,0.036865067481994626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,6144,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,5120,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,4096,0.026898133754730224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,65536,0.22463146845499674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,3072,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,2560,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,2048,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,1024,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,768,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,256,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,16384,0.055569068590799964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,12288,0.04519146680831909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,10240,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,8192,0.036931200822194414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,65536,0.20933866500854492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,6144,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,5120,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,2048,0.022731733322143555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,3072,0.026280534267425538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,1024,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,128,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,16384,0.05276906490325928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,12288,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,65536,0.2047658602396647
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,10240,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,8192,0.03590826590855916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,6144,0.03126506606737773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,5120,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,4096,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,3584,0.026690133412679035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,2048,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,1024,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,768,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,512,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,256,0.017545600732167564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,128,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,16384,0.049628798166910806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,12288,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,65536,0.20599466959635415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,10240,0.04102933406829834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,8192,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,6144,0.03174399932225545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,5120,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,3584,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,3072,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,2560,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,1024,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,768,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,256,0.016587733229001363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,512,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,64,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,16384,0.05130240122477213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,12288,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,65536,0.20264959335327148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,10240,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,8192,0.0362496018409729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,6144,0.031470932563145954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,5120,0.029422932863235475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,3072,0.02655679980913798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,2048,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,768,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,1024,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,128,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,64,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,32,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,16384,0.5827957153320312
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,12288,0.43246933619181316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,10240,0.3771733283996582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,8192,0.2983263969421387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,6144,0.22504107157389322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,7168,0.264465061823527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,4096,0.15967466036478678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,5120,0.18968000411987304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,3072,0.1318559964497884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,3584,0.14199573198954266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,2048,0.09724586804707845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,2560,0.11475626627604167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,1024,0.06382933457692465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,1536,0.07990612983703613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,768,0.057241598765055336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,512,0.05140479803085327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,256,0.0476149320602417
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,128,0.036111998558044436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,64,0.03563520113627116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,65536,32,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,16384,0.1796778678894043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,12288,0.13981013298034667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,10240,0.12253866990407307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,65536,0.6705834706624348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,8192,0.09520959854125977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,7168,0.08601706822713216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,5120,0.06751573085784912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,6144,0.07485439777374267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,4096,0.06099520126978556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,3584,0.05457813342412313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,3072,0.0506880005200704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,2560,0.04450986782709758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,2048,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,1536,0.0348853349685669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,1024,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,768,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,512,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,256,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,128,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,64,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,16384,32,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,16384,0.13554347356160482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,12288,0.10806612968444824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,65536,0.5073237419128418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,10240,0.09642666975657145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,8192,0.07990612983703613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,7168,0.07365972995758056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,6144,0.0634879986445109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,5120,0.058266667524973545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,4096,0.05130240122477213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,3584,0.04857279856999715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,3072,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,2560,0.039867734909057616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,2048,0.03625066677729289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,1536,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,768,0.025257599353790284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,1024,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,512,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,256,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,12288,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,16384,0.12509866555531818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,12288,0.09980586369832357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,65536,0.4733951886494954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,10240,0.08485759894053141
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,8192,0.07167999744415283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,7168,0.06550186475118001
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,6144,0.057513598601023355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,5120,0.05232640107472738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,4096,0.046284798781077066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,3584,0.04457919994990031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,3072,0.03945813179016113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,2560,0.037138132254282634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,2048,0.03338346481323242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,1536,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,1024,0.02764906684557597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,768,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,512,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,256,0.023004800081253052
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,64,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,128,0.020750933885574342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,10240,32,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,16384,0.10905600388844808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,12288,0.08813119729359944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,65536,0.4042069435119629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,10240,0.07672853469848633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,8192,0.06451520125071207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,7168,0.059393068154652916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,6144,0.05181546608606974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,5120,0.04806079864501953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,4096,0.042803200085957845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,3584,0.04116479953130086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,3072,0.03713599840799968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,2560,0.03508906761805217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,2048,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,1536,0.02956053415934245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,1024,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,768,0.02321173350016276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,512,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,256,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,128,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,8192,32,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,16384,0.09598186810811361
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,512,1536,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,12288,0.07768747011820475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,65536,0.364851188659668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,10240,0.0698357343673706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,8192,0.05956159830093384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,7168,0.05447786649068197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,6144,0.048196268081665036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,5120,0.04437333345413208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,4096,0.0413696010907491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,3072,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,3584,0.037409067153930664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,2560,0.03304106593132019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,2048,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,1536,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,1024,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,768,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,256,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,7168,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1024,256,1536,0.022498132785161336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,16384,0.09086293379465739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,10240,0.06440960168838501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,12288,0.07341972986857095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,8192,0.056524801254272464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,7168,0.05000426769256592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,6144,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,65536,0.3322197278340658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,5120,0.04314346710840861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,4096,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,3584,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,3072,0.034747731685638425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,2560,0.03249386747678121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,2048,0.030447999636332195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,1024,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,768,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,1536,0.025870933135350542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,64,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,12288,0.07007573445638021
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,16384,0.08680000305175781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,10240,0.06297599871953329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,8192,0.05341973304748535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,7168,0.049322664737701416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,6144,0.043828264872233076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,5120,0.04130133390426636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,65536,0.3297621409098307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,4096,0.03850239912668864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,3584,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,3072,0.03392959833145141
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,2560,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,2048,0.029288534323374433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,1536,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,1024,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,768,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,512,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,64,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,5120,32,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,10240,0.054271999994913736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,16384,0.07581013043721517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,12288,0.061508266131083164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,7168,0.04485119978586833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,8192,0.047888000806172684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,6144,0.03973013162612915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,65536,0.2891093254089355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,5120,0.03884373505910237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,4096,0.035361067454020186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,3584,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,2560,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,2048,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,1536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,768,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,512,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,128,0.01726933320363363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,32,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,16384,0.07137280305226644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,12288,0.057275732358296715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,10240,0.05191680192947388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,8192,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,65536,0.27286081314086913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,7168,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,5120,0.03543039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,6144,0.03850133419036865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,4096,0.034679468472798666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,3584,0.031267199913660684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,3072,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,2560,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,2048,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,1536,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,768,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,512,0.01904746691385905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3584,32,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,16384,0.06765120029449463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,12288,0.053624534606933595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,10240,0.04945813417434693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,65536,0.2516991933186849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,8192,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,7168,0.04096000194549561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,6144,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,5120,0.034109866619110106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,4096,0.03222186764081319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,3584,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,3072,0.027513599395751952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,2560,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,2048,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,1024,0.020886399348576865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,768,0.019388800859451293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,3072,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,16384,0.06440960168838501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,12288,0.051541332403818765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,10240,0.047856001059214275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,8192,0.04198400179545085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,65536,0.237772798538208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,7168,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,5120,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,6144,0.03584213256835937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,4096,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,3584,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,3072,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,2560,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,2048,0.02464639941851298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,1024,0.020890667041142782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,768,0.018910932540893554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,256,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,64,0.0173418660958608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,16384,0.06021120150883993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,12288,0.04894719918568929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,10240,0.04720746676127116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,65536,0.21869227091471352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,8192,0.03952639897664388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,7168,0.037546666463216145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,6144,0.034883201122283936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,5120,0.03126613299051921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,4096,0.030242133140563964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,3584,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,3072,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,2560,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,2048,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,1024,0.021434666713078816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,768,0.0188426673412323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,64,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,2048,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,16384,0.056968533992767335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,12288,0.047172268231709794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,10240,0.04437439839045207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,65536,0.2035370667775472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,8192,0.037001601854960126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,7168,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,6144,0.03297386765480041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,5120,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,4096,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,3584,0.026759467522303265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,3072,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,2560,0.024689066410064697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,2048,0.022802132368087768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,1024,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,1536,0.02129813234011332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1536,32,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,16384,0.05577386617660522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,12288,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,10240,0.04130239884058635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,65536,0.18547840118408204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,8192,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,7168,0.03365653355916341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,6144,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,4096,0.02744213342666626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,3584,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,2560,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,1536,0.021233065923055013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,1024,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,768,0.018569600582122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,256,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,16384,0.053350400924682614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,12288,0.04314560095469157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,10240,0.03973226547241211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,65536,0.1751050631205241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,8192,0.03481493393580119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,7168,0.03287039995193482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,6144,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,4096,0.02696746587753296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,3584,0.02662293314933777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,3072,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,2560,0.023075199127197264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,1536,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,2048,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,1024,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,768,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,512,0.018161066373189292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,16384,0.049356798330942794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,12288,0.04396373430887858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,10240,0.03870720068613688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,65536,0.16814079284667968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,8192,0.03338239987691243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,7168,0.03283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,5120,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,2560,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,1536,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,1024,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,768,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,512,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,128,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,16384,0.046216531594594316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,12288,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,8192,0.03372373183568318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,10240,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,65536,0.1613141377766927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,7168,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,6144,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,3584,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,2560,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,3072,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,1536,0.0211626668771108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,1024,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,16384,0.043894398212432864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,12288,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,8192,0.03304106593132019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,10240,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,65536,0.1555829366048177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,6144,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,7168,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,5120,0.02723840077718099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,3584,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,2560,0.02362133264541626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,2048,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,3072,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,1536,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,1024,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,768,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,512,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,128,32,0.016244266430536905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,16384,0.04334933360417684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,12288,0.037069865067799884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,10240,0.036933334668477376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,65536,0.15503466924031575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,7168,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,6144,0.029285333553949994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,3584,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,4096,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,2560,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,1024,0.019523199399312338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,768,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,256,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,64,0.015220266580581666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,32,0.01665600041548411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,65536,0.1572864055633545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,16384,0.04307733376820882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,12288,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,10240,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,8192,0.033725865681966144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,7168,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,6144,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,4096,3072,0.03078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,4096,0.026147200663884478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,3584,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,3072,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,2560,0.022663466135660806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,2048,0.02211946646372477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,1024,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,512,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,16384,0.391645876566569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,12288,0.3019434611002604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,10240,0.24016213417053223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,8192,0.1937727928161621
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,7168,0.17237332661946614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,6144,0.1508021354675293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,5120,0.12827306588490803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,4096,0.10601812998453777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,3584,0.09458346366882324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,3072,0.08410453001658122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,2560,0.07424000104268393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,2048,0.064683731396993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,1536,0.05532906850179037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,1024,0.04519253174463908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,768,0.04034239848454793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,512,0.0357045332590739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,256,0.03317760030428569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,128,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,64,0.03249599933624268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,65536,32,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,65536,0.4207274754842122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,16384,0.11977386474609375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,12288,0.09693866570790609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,10240,0.08362560272216797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,8192,0.06986880302429199
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,7168,0.06642346779505412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,6144,0.061508266131083164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,5120,0.05502293507258097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,4096,0.04734186728795369
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,3584,0.04457919994990031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,3072,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,2560,0.03788906733194987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,2048,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,1536,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,1024,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,512,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,256,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,128,0.022322134176890055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,64,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,16384,32,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,65536,0.3505162556966146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,16384,0.09844160079956055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,12288,0.08052053451538085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,10240,0.06925653616587321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,8192,0.05796053409576416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,7168,0.05549973249435425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,6144,0.05198506514231364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,5120,0.04679679870605469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,4096,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,3584,0.03884479999542236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,3072,0.03590826590855916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,2560,0.03311040004094441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,2048,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,1536,0.028195200363794963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,1024,0.024437334140141806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,768,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,512,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,256,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,128,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,12288,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,65536,0.3170986811319987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,16384,0.09308160146077474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,12288,0.0771071990331014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,10240,0.06352213223775229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,8192,0.05403306484222412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,7168,0.051268267631530764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,6144,0.04751360019048055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,5120,0.04246079921722412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,4096,0.03836693366368611
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,3584,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,3072,0.03358613252639771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,2560,0.032152533531188965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,2048,0.029765333731969195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,1536,0.02696746587753296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,1024,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,768,0.022392533222834268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,512,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,256,0.019115734100341796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,10240,32,0.01972800095876058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,65536,0.2646666685740153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,8192,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,16384,0.0781994660695394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,12288,0.0665183981259664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,10240,0.05761706829071045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,8192,0.04922026793162028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,7168,0.04727466503779094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,6144,0.043280001481374106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,5120,0.040550398826599124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,4096,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,3584,0.03495146830876668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,3072,0.03269973397254944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,64,512,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,2560,0.030855466922124226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,2048,0.028195200363794963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,1536,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,768,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,512,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,256,0.018706132968266807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,128,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,64,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,8192,32,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,12288,0.06328213214874268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,16384,0.07512853145599366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,10240,0.05522773265838623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,8192,0.047378134727478025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,65536,0.25886720021565757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,7168,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,6144,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,5120,0.038430933157602945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,4096,0.03536213239034017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,3584,0.03379093408584595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,3072,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,2560,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,2048,0.027922133604685467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,1536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,1024,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,768,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,512,0.018637865781784058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,128,0.01802133321762085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,7168,32,0.016860800981521606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,16384,0.067413330078125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,12288,0.05850453376770019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,10240,0.04986986716588338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,8192,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,65536,0.23961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,7168,0.041303467750549314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,6144,0.03911786476771037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,5120,0.03720426559448242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,3584,0.032152533531188965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,3072,0.030447999636332195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,4096,0.03317866722742717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,2560,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,2048,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,1536,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,1024,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,768,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,256,0.018567466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,64,0.016999467213948568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,6144,32,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,16384,0.06297706762949626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,12288,0.05500906705856323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,10240,0.046452267964680986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,8192,0.040381864706675215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,65536,0.2274986743927002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,768,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,7168,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,6144,0.037137067317962645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,5120,0.03508906761805217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,4096,0.031473066409428915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,3584,0.03078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,3072,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,2560,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,1024,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,768,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,2048,0.024781866868336996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,1536,0.02245866656303406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,256,0.018228266636530557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,128,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,5120,32,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,16384,0.05937920014063517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,12288,0.04894826809565227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,10240,0.042734932899475095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,8192,0.037205334504445395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,6144,0.03505386511484782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,65536,0.19527680079142254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,7168,0.0362496018409729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,5120,0.03263253370920817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,4096,0.030514132976531983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,3584,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,3072,0.02723840077718099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,2048,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,1024,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,768,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,64,0.016455466548601784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,32,0.017614932854970296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,4096,128,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,12288,0.04747946659723918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,16384,0.056797866026560465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,10240,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,65536,0.18547946612040203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,7168,0.03563520113627116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,8192,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,6144,0.03351999918619792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,4096,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,5120,0.03140373428662618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,3584,0.02723840077718099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,3072,0.02525866627693176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,2560,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,1536,0.02157333294550578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,1024,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,128,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,64,0.016658133268356322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3584,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,12288,0.0466261347134908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,16384,0.053521064917246494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,10240,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,7168,0.03556693394978841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,8192,0.03659093379974365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,6144,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,65536,0.1632256031036377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,5120,0.03208746711413066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,4096,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,3584,0.026689066489537554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,3072,0.02518933415412903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,1536,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,1024,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,768,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,512,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,64,0.016790399948755898
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,32,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,3072,128,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,12288,0.04491946697235107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,16384,0.049322664737701416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,10240,0.037614933649698895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,65536,0.15721920331319172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,8192,0.034883201122283936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,7168,0.03351893424987793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,5120,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,4096,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,2560,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,1536,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,2048,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,768,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,1024,0.018908800681432088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,128,0.016450132926305136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,64,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,12288,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,16384,0.04911786715189616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,10240,0.038230399290720626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,65536,0.14124372800191243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,7168,0.03290346662203471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,8192,0.03399786551793416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,6144,0.03065173427263896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,4096,0.026281599203745527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,3584,0.025464532772699992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,1536,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,3072,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,1024,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,768,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,512,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,256,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,128,0.0169322669506073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,2048,32,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,12288,0.04102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,16384,0.04710293213526408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,10240,0.035974399248758955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,7168,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,8192,0.03283519943555196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,6144,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,65536,0.13178986708323162
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,5120,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,4096,0.026012800137201947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,3584,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,3072,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,2048,0.02198186715443929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,512,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,32,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1536,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,12288,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,16384,0.04539733330408732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,10240,0.03331519961357117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,65536,0.12076373100280761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,7168,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,6144,0.02805759906768799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,3072,0.023209599653879802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,3584,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,2560,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,2048,0.02130026618639628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,1536,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,64,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,16384,0.043755733966827394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,12288,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,65536,0.11670186519622802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,10240,0.03344959815343221
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,8192,0.029419734080632524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,7168,0.02935466567675273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,6144,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,4096,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,3584,0.023960532744725545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,2560,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,2048,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,768,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,512,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,128,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,768,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,16384,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,12288,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,10240,0.033129600683848064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,8192,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,65536,0.11171840031941731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,7168,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,6144,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,5120,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,4096,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,3584,0.023756800095240276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,3072,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,1536,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,768,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,512,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,256,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,64,0.016999467213948568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,512,32,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,16384,0.03898133436838786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,10240,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,8192,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,65536,0.105404798189799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,7168,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,6144,0.026829866568247478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,5120,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,3584,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,1536,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,768,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,512,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,128,0.015361066659291586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,12288,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,65536,0.1008639971415202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,8192,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,7168,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,6144,0.027102933327356978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,3584,0.02450666626294454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,4096,0.02403093377749125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,5120,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,2560,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,2048,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,1536,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,768,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,512,0.017816533644994102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,128,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,128,32,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,12288,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,16384,0.03543146848678589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,10240,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,65536,0.09898666540781656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,8192,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,6144,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,7168,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,5120,0.026694399118423463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,4096,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,3584,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,2560,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,1536,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,768,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,128,0.015359999736150107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,64,32,0.01570026675860087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,16384,0.036933334668477376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,12288,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,65536,0.09803093274434407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,8192,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,7168,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,6144,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,4096,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,3584,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,3072,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,2560,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,1536,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,768,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,512,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,128,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,32,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,12288,0.22770346005757652
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,16384,0.30924800237019856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,10240,0.19588586489359539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,8192,0.16233919461568197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,7168,0.14513492584228516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,6144,0.12482559680938721
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,5120,0.104584534962972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,4096,0.09000960191090902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,3584,0.07976960341135661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,3072,0.07055359681447347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,2560,0.06417066653569539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,2048,0.05549973249435425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,1536,0.0475818673769633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,1024,0.039527467886606854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,512,0.031879466772079465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,256,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,768,0.03515413204828898
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,128,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,64,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,65536,32,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,16384,0.10287893613179525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,12288,0.08099839687347413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,10240,0.0784714698791504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,65536,0.33870506286621094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,8192,0.06850666999816894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,7168,0.0630783994992574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,6144,0.057241598765055336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,5120,0.05075733264287313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,4096,0.044715734322865804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,3584,0.040686933199564616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,3072,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,2560,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,2048,0.031198932727177935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,1536,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,768,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,1024,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,256,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,128,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,512,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,64,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,16384,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,16384,0.0843775987625122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,12288,0.06874240239461263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,10240,0.06386239926020304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,65536,0.2750464121500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,8192,0.0575488011042277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,7168,0.05249493519465128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,5120,0.04212053219477336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,6144,0.048230401674906415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,4096,0.03720426559448242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,3584,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,3072,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,2560,0.030925865968068438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,2048,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,1536,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,768,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,256,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,128,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,512,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,12288,32,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,16384,0.08226666450500489
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,12288,0.06594773530960082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,10240,0.06164480050404867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,65536,0.2612565358479818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,8192,0.050892798105875645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,7168,0.04628586769104004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,5120,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,6144,0.04177920023600261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,4096,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,3584,0.03351893424987793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,3072,0.03113066752751668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,2560,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,2048,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,1536,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,1024,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,768,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,512,0.01945706605911255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,64,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,10240,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,16384,0.07461439768473307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,12288,0.059630934397379556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,65536,0.22339946428934732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,10240,0.053384534517923986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,8192,0.0474453330039978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,6144,0.03959360122680664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,5120,0.03597653309504191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,7168,0.043622398376464845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,4096,0.03304106593132019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,3584,0.03078719973564148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,3072,0.030036266644795733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,2560,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,2048,0.026215465863545735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,1536,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,1024,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,768,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,512,0.02027413249015808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,64,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,8192,32,0.017153066396713258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,16384,0.06734506289164224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,12288,0.05368533531824747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,65536,0.20155733426411948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,10240,0.048810664812723795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,8192,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,7168,0.04041386842727661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,6144,0.036999468008677164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,4096,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,5120,0.03379199902216594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,3584,0.030445865790049237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,3072,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,2048,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,2560,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,1024,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,768,0.019320533672968546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,32,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,7168,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,12288,0.051437866687774655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,16384,0.06546133359273275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,8192,0.04171093304951985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,10240,0.046419199307759604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,65536,0.1805631955464681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,7168,0.039049601554870604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,6144,0.035086933771769205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,5120,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,4096,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,3584,0.029219200213750202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,3072,0.027102933327356978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,2560,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,2048,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,1024,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,1536,0.021025067567825316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,768,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,256,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,64,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,6144,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,16384,0.06048426628112793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,12288,0.04748053153355916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,10240,0.04328213135401408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,65536,0.16977920532226562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,8192,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,7168,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,5120,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,6144,0.034270934263865155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,4096,0.030036266644795733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,3584,0.027988266944885255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,3072,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,512,1024,8192,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,2048,0.023822933435440063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,1536,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,1024,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,768,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,128,0.017543466885884602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,64,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,12288,0.04746880133946736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,10240,0.04109760125478108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,16384,0.056184534231821695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,65536,0.15202986399332682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,8192,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,7168,0.03426986535390218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,6144,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,5120,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,4096,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,3584,0.024987733364105223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,3072,0.024577067295710246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,2048,0.02321066657702128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,1024,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,768,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,64,0.017543466885884602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,32,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,4096,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,12288,0.04382933378219604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,16384,0.05362240076065063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,10240,0.03932266632715861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,65536,0.1426090717315674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,8192,0.034953598181406656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,7168,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,6144,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,5120,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,3584,0.02648853262265523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,4096,0.027374933163324993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,2560,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,3072,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,2048,0.02198186715443929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,512,0.018362667163213095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,768,0.017950934171676636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,128,0.01672640045483907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,32,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3584,64,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,12288,0.04116479953130086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,10240,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,16384,0.04863893191019694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,65536,0.1325055996576945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,8192,0.03495146830876668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,7168,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,4096,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,3584,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,3072,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,5120,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,2048,0.021572266022364298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,1536,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,512,0.0184714674949646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,3072,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,12288,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,10240,0.037206399440765384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,16384,0.04703679879506429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,65536,0.12506453196207684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,8192,0.03338666756947835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,7168,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,6144,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,4096,0.025191466013590496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,3584,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,2560,0.021780266364415487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,2048,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,768,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,16384,0.04746026595433553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,12288,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,65536,0.11591573556264241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,10240,0.03529493411382039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,8192,0.032153600454330446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,7168,0.030857600768407184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,6144,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,5120,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,3584,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,2560,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,2048,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,1536,0.019453867276509603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,1024,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,512,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,256,0.016862932840983072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2048,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,16384,0.04430506626764934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,12288,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,10240,0.03303999900817871
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,8192,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,65536,0.10240000089009602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,7168,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,6144,0.028193066517512005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,3584,0.023826134204864503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,2560,0.02116480072339376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,3072,0.02191466689109802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,2048,0.020822399854660036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,1536,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,768,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,1024,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,512,0.017748266458511353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,128,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1536,32,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,16384,0.04123946825663249
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,12288,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,10240,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,8192,0.030445865790049237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,65536,0.10093333721160888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,7168,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,6144,0.027169066667556762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,3584,0.023414399226506552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,3072,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,2560,0.020819199085235596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,2048,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,1024,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,1536,0.018565332889556883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,768,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,512,0.017409066359202065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,16384,0.040209066867828366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,12288,0.03461013237635295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,65536,0.09239892959594727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,8192,0.02969706654548645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,5120,0.025397332509358723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,7168,0.02778559923171997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,4096,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,3584,0.02286826570828756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,3072,0.021708800395329794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,2560,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,1536,0.01863573392232259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,1024,0.018296533823013307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,768,0.018296533823013307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,128,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,64,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,768,32,0.015428266922632852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,16384,0.037546666463216145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,12288,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,65536,0.0869376023610433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,7168,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,8192,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,4096,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,2560,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,2048,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,1536,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,1024,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,512,0.017410133282343546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,512,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,16384,0.035018666585286455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,12288,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,65536,0.08000853061676025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,8192,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,7168,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,6144,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,5120,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,3584,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,4096,0.02409706711769104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,2560,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,3072,0.021504000822703043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,256,32,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,12288,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,10240,0.02990506688753764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,8192,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,65536,0.07430933316548666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,7168,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,6144,0.027170133590698243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,5120,0.024029866854349772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,4096,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,3584,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,3072,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,1024,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,1536,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,768,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,512,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,128,32,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,16384,0.034815998872121175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,65536,0.07185173034667969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,10240,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,8192,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,4096,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,3072,0.020754132668177286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,1024,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,768,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,64,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,65536,0.07246507008870443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,10240,0.02935466567675273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,8192,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,7168,0.02744320034980774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,5120,0.0253930668036143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,3072,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,2560,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,1536,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,1024,0.018294399976730345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,768,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,512,0.016450132926305136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,32,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,12288,0.21951252619425454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,16384,0.27811733881632483
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,10240,0.16274773279825847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,7168,0.11694186528523762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,6144,0.10315093199412029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,5120,0.09065813223520915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,4096,0.07744853496551514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,3584,0.06928959687550863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,3072,0.059495464960734046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,2560,0.053350400924682614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,2048,0.04700053135553996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,1536,0.040889600912729904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,1024,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,768,0.03269973397254944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,512,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,256,0.02696640094121297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,128,0.02566933234532674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,64,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,32,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,65536,0.26033493677775066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,16384,0.08290987014770508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,12288,0.07045119603474935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,10240,0.06202026605606079
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,8192,0.05345173279444376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,7168,0.049561599890391037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,6144,0.04539733330408732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,5120,0.040958933035532635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,4096,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,3584,0.034542934099833174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,3072,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,2560,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,2048,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,1536,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,1024,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,768,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,512,0.019385600090026857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,256,0.019048533837000527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,128,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,16384,32,0.020683733622233073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,65536,0.19903146425882975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,16384,0.06574186484018961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,12288,0.05809599955876669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,10240,0.051780267556508386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,8192,0.045533867677052815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,7168,0.0425983985265096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,2560,1024,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,6144,0.03891199827194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,5120,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,4096,0.03283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,3584,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,3072,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,2560,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,2048,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,1536,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,1024,0.020718934138615926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,512,0.019799466927846274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,768,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,256,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,12288,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,16384,0.05946453412373861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,12288,0.053010133902231846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,65536,0.21186559995015464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,10240,0.04754773378372192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,7168,0.03891306718190511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,6144,0.03495146830876668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,5120,0.03283519943555196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,4096,0.02997013330459595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,3584,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,3072,0.027510400613149005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,2560,0.02635306715965271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,2048,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,1536,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,1024,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,512,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,256,0.01775040030479431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,32,0.017545600732167564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,65536,0.18452480634053547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,16384,0.05570666790008545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,12288,0.048844798405965166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,10240,0.0421887993812561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,8192,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,6144,0.03283519943555196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,5120,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,4096,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,3584,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,3072,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,2560,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,2048,0.0211626668771108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,1536,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,768,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,512,0.01713599960009257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,65536,0.16568320592244465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,16384,0.052121599515279136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,12288,0.0464906652768453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,10240,0.04068586826324463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,8192,0.035290666421254474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,7168,0.03331519961357117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,6144,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,5120,0.02955840031305949
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,4096,0.027306665976842243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,3584,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,3072,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,2560,0.022734934091567995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,2048,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,1536,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,768,0.017270400126775106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,7168,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,384,64,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,65536,0.14103892644246419
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,16384,0.04994026819864909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,12288,0.04341866572697957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,10240,0.039185067017873124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,8192,0.0348853349685669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,7168,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,4096,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,5120,0.02935466567675273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,3584,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,3072,0.024577067295710246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,2560,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,2048,0.021501866976420085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,1536,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,1024,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,768,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,256,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,512,0.01761173407236735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,16384,0.046284798781077066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,65536,0.1408352057139079
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,12288,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,10240,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,8192,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,7168,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,6144,0.029215999444325763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,65536,8192,0.1300821304321289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,5120,0.027782400449117024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,3584,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,2560,0.022116265694300332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,2048,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,768,0.018023467063903807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,16384,0.04396373430887858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,12288,0.03918613195419311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,65536,0.1113429307937622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,8192,0.03174399932225545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,10240,0.03590933481852214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,6144,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,5120,0.02737706700960795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,7168,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,4096,0.02532800038655599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,3584,0.02368853290875753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,3072,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,2560,0.0211626668771108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,1536,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,768,0.016926934321721397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,512,0.016587733229001363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,4096,32,0.016472533345222473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,16384,0.040550398826599124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,65536,0.10973866780598958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,12288,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,10240,0.034542934099833174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,8192,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,7168,0.029285333553949994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,6144,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,5120,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,4096,0.02443839907646179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,3584,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,3072,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,2048,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,2560,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,1536,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,768,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3584,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,12288,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,16384,0.04205120007197062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,65536,0.10240000089009602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,10240,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,8192,0.03031253417332967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,7168,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,6144,0.026759467522303265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,3584,0.02286826570828756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,2560,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,3072,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,2048,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,1024,0.01843413313229879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,512,0.016860800981521606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,3072,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,16384,0.04116586844126384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,12288,0.035021865367889406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,65536,0.09256959756215413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,10240,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,8192,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,7168,0.027581866582234698
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,5120,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,4096,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,3072,0.020890667041142782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,3584,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,2048,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,1024,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,64,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2560,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,16384,0.03911573489507039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,65536,0.08666453361511231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,10240,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,8192,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,2048,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,1024,0.017475199699401856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,768,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,2048,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,16384,0.03713920116424561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,12288,0.03556693394978841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,65536,0.08024746576944987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,10240,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,8192,0.027784534295399982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,7168,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,6144,0.026554665962855023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,4096,0.022779732942581177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,5120,0.02403093377749125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,3584,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,3072,0.020888533194859824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,2560,0.02048106590906779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,1024,0.01781546672185262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,512,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,128,0.016109866897265117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1536,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,16384,0.034953598181406656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,12288,0.032358400026957196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,65536,0.0731818675994873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,10240,8192,0.04130133390426636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,8192,0.026829866568247478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,7168,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,6144,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,5120,0.023143466313680014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,3584,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,3072,0.020600533485412596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,2560,0.020139733950297035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,2048,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,1536,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,1024,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,768,0.017746132612228394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,32,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,16384,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,65536,0.06959786415100097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,10240,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,7168,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,6144,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,3584,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,3072,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,2048,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,768,0.017951999107996622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,256,0.016724266608556113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,16384,0.03283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,65536,0.06342080036799112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,10240,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,7168,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,8192,0.026690133412679035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,5120,0.023757867018381753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,4096,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,3584,0.02074986696243286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,3072,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,2560,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,2048,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,1024,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,768,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,512,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,256,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,512,32,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,16384,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,65536,0.0612010677655538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,7168,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,5120,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,3584,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,3072,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,2560,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,2048,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,1536,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,1024,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,768,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,256,0.016450132926305136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,16384,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,65536,0.05597759882609049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,5120,0.024574933449427287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,4096,0.02430400053660075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,3584,0.02095680038134257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,2560,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,2048,0.01863573392232259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,1536,0.01842986742655436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,1024,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,128,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,64,0.015292800466219583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,65536,0.05355519851048788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,12288,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,7168,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,6144,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,4096,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,3072,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,2560,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,2048,0.018706132968266807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,1536,0.01775040030479431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,1024,0.017199999094009398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,128,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,256,0.01583573321501414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,64,0.015268266201019287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,64,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,65536,0.054100267092386876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,12288,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,10240,0.02669546604156494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,8192,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,7168,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,4096,0.022730666399002075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,3584,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,2560,0.020139733950297035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,1024,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,128,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,64,0.016160000363985697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,32,32,0.01495039959748586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,16384,0.2393418629964193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,12288,0.18343253135681153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,10240,0.14124372800191243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,8192,0.12014933427174886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,6144,0.0942080020904541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,7168,0.10584746996561686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,4096,0.07058773040771485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,5120,0.08181866804758707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,3072,0.0565226674079895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,3584,0.06174720128377279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,2048,0.04471466541290283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,2560,0.05085973342259725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,1536,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,1024,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,768,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,512,0.028874667485555013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,256,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,128,0.02259413401285807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,64,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,65536,32,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,16384,0.08017919858296713
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,12288,0.06403413216272989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,65536,0.2414933363596598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,10240,0.0571722666422526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,8192,0.05079040129979452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,7168,0.0454645315806071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,6144,0.04198293288548787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,4096,0.03433813254038493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,5120,0.037137067317962645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,3584,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,3072,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,2560,0.027893332640329997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,2048,0.026075732707977296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,1536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,1024,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,768,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,256,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,16384,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,16384,0.06782293319702148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,65536,0.2096127986907959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,12288,0.05587519804636637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,10240,0.05024533271789551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,8192,0.04341760079065959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,7168,0.0392522652943929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,6144,0.035225598017374675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,5120,0.03269866704940796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,4096,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,3584,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,3072,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,2560,0.025396267573038738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,2048,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,1024,0.019934932390848793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,512,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,256,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,12288,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,16384,0.06717440287272135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,65536,0.1850015958150228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,12288,0.05621653397878011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,10240,0.05010773340861002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,8192,0.043281066417694095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,7168,0.039867734909057616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,6144,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,5120,0.03399680058161418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,4096,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,3584,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,3072,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,2560,0.02600853244463603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,2048,0.02341653307278951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,1536,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,512,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,256,0.018296533823013307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,128,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,10240,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,16384,0.05599466562271118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,65536,0.1614517370859782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,12288,0.05253119866053263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,10240,0.04734186728795369
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,8192,0.04212053219477336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,7168,0.03304213285446167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,6144,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,5120,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,4096,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,3584,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,3072,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,2560,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,1536,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,768,0.017477333545684814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,512,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,256,0.017475199699401856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,128,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,16384,0.05768533150355021
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,65536,0.13946986198425293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,12288,0.04881173372268677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,10240,0.04700160026550293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,8192,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,7168,0.03269973397254944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,5120,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,4096,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,3584,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,3072,0.024370133876800537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,2560,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,2048,0.021574399868647256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,1024,0.01938986579577128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,768,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,128,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,1024,10240,0.028806400299072266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,16384,0.05174613396326701
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,12288,0.043280001481374106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,65536,0.12622506618499757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,10240,0.03891199827194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,8192,0.03426986535390218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,5120,0.02826346755027771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,6144,0.03031146725018819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,7168,0.031947733958562215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,4096,0.026625066995620728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,3584,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,3072,0.023963733514149984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,1024,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,1536,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,768,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,512,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,128,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,64,0.016428800423940022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,6144,32,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,16384,0.050587733586629234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,12288,0.04102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,65536,0.12192426522572834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,10240,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,8192,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,7168,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,6144,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,5120,0.02737706700960795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,3584,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,4096,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,3072,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,2560,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,2048,0.01904319922129313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,1024,0.018498132626215615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,768,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,16384,0.04532906611760457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,12288,0.037138132254282634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,65536,0.10448213418324788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,10240,0.034747731685638425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,7168,0.02887786626815796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,8192,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,6144,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,4096,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,2048,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,2560,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,768,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,4096,32,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,12288,0.03747733434041341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,16384,0.04939093192418416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,65536,0.09680213133494059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,10240,0.034406399726867674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,8192,0.031062400341033934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,7168,0.029967999458312987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,6144,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,4096,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,3584,0.02225386699040731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,2048,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,2560,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,1024,0.01843093236287435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,768,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,256,0.0169322669506073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,12288,0.033659732341766356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,256,128,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,65536,0.09089706738789877
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,10240,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,8192,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,7168,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,4096,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,6144,0.02648959954579671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,3584,0.02211946646372477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,3072,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,2560,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,1536,0.01854613423347473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,1024,0.017614932854970296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,3072,32,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,16384,0.0413696010907491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,12288,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,65536,0.08584533532460531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,8192,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,7168,0.026898133754730224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,5120,0.023826134204864503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,3584,0.021163733800252278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,3072,0.021028266350428263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,2560,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,2048,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,1024,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,768,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,128,0.0164490669965744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2560,32,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,16384,0.03878506819407145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,10240,0.03072106639544169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,65536,0.07823359966278076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,12288,0.03263360063234965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,8192,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,7168,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,6144,0.02655679980913798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,5120,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,2048,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,2560,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,1024,0.01699733336766561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,128,0.016794667641321818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,2048,32,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,12288,0.03276906609535217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,65536,0.07314666906992594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,8192,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,10240,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,7168,0.025441066424051924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,5120,0.022529067595799764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,4096,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,2048,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,1024,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,256,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1536,128,0.01624853312969208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,65536,0.06475093364715576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,16384,0.034543999036153156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,10240,0.0277834673722585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,8192,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,3584,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,4096,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,3072,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,1536,0.018569600582122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,2048,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,1024,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,16384,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,10240,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,12288,0.031129600604375203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,65536,0.05809599955876669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,6144,0.023689599831899007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,7168,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,5120,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,4096,0.02198186715443929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,3072,0.01918399930000305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,32,0.016587733229001363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,768,64,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,16384,0.031062400341033934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,65536,0.059630934397379556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,12288,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,8192,0.026349866390228273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,6144,0.023209599653879802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,4096,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,5120,0.02211839954058329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,3584,0.02068159977595011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,2560,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,1024,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,256,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,128,0.015415466825167336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,64,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,512,32,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,65536,0.0505184014638265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,10240,0.02682773272196452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,16384,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,12288,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,7168,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,5120,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,4096,0.021504000822703043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,3584,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,3072,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,2048,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,256,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,128,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,16384,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,65536,0.04932159980138143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,12288,0.028056534131368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,8192,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,10240,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,7168,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,6144,0.024372265736262003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,5120,0.02327893376350403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,4096,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,3072,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,2560,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,512,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,256,0.016908800601959227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,128,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,65536,0.04724053144454956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,10240,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,7168,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,6144,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,5120,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,3072,0.019662932554880778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,2560,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,2048,0.018631466229756675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,128,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,10240,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,65536,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,8192,0.02430400053660075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,6144,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,3072,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,2048,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,2560,0.018569600582122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,1024,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,64,0.01495039959748586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,192,32,32,0.017139200369517008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,12288,0.16165547370910643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,16384,0.21213760375976562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,8192,0.11842880249023438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,10240,0.14507199923197428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,5120,0.08232959906260172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,6144,0.09495680332183838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,4096,0.06987093289693197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,7168,0.10712107022603352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,3072,0.05768533150355021
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,3584,0.06307946840922038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,2560,0.04990293184916179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,2048,0.04375893274943034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,1024,0.031129600604375203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,768,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,1536,0.03898133436838786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,512,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,256,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,64,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,128,0.021572266022364298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,65536,32,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,12288,0.062326399485270176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,16384,0.07833279768625895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,10240,0.0550922671953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,7168,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,8192,0.048059733708699544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,65536,0.2456223964691162
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,6144,0.040550398826599124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,5120,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,4096,0.03297173380851746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,3584,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,1536,0.023756800095240276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,2560,0.02730773289998372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,2048,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,3072,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,1024,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,768,0.01993280053138733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,512,0.01843093236287435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,256,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,128,0.01801919937133789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,64,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,16384,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,16384,0.06478399833043416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,12288,0.053521064917246494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,10240,0.04713600079218547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,65536,0.1922730604807536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,8192,0.04181333382924397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,7168,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,6144,0.03509013255437215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,4096,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,3584,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,3072,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,5120,0.03174506624539693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,2560,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,2048,0.02450666626294454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,1024,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,64,0.018946133057276406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,12288,32,0.018373332420984902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,12288,0.05331626733144125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,10240,0.04686400095621745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,16384,0.06532693306605021
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,65536,0.17967467308044432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,8192,0.04451093276341756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,7168,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,6144,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,5120,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,4096,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,3584,0.027989333868026732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,2560,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,3072,0.025257599353790284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,2048,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,1536,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,512,0.018091734250386557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,256,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,32,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,10240,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,16384,0.05120000044504801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,12288,0.043178665637969973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,65536,0.1469098726908366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,10240,0.03884479999542236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,8192,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,7168,0.032358400026957196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,5120,0.02778559923171997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,3584,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,4096,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,3072,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,2048,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,1024,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,512,0.017064533631006875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,128,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,768,0.01665493349234263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,16384,0.04986879825592041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,12288,0.04150506655375163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,10240,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,65536,0.133187198638916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,8192,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,7168,0.03133440017700195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,5120,0.028670932849248248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,6144,0.029012266794840497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,3584,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,4096,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,3072,0.023959465821584067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,2560,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,2048,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,1024,0.019113600254058838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,768,0.018023467063903807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,1536,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,512,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,256,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,128,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,64,0.016463999946912132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,7168,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,16384,0.05092693169911703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,10240,0.037614933649698895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,12288,0.041368532180786136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,65536,0.11936426957448323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,8192,0.03290560046831767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,7168,0.031471999486287434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,5120,0.028670932849248248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,6144,0.02887786626815796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,4096,0.026147200663884478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,3584,0.02485226591428121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,3072,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,2560,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,2048,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,768,0.01754666765530904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,12288,0.040686933199564616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,16384,0.048878931999206544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,65536,0.11246720155080159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,10240,0.036865067481994626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,8192,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,7168,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,6144,0.02969493269920349
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,4096,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,5120,0.026829866568247478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,3584,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,2048,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,768,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,128,0.01590506633122762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,5120,32,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,12288,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,16384,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,65536,0.0984394629796346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,10240,0.03126506606737773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,8192,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,7168,0.026897066831588747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,5120,0.02450666626294454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,3584,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,3072,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,2560,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,1024,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,128,0.016179200013478598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,4096,64,0.01644373337427775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,16384,0.042530135313669844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,65536,0.08915627002716064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,12288,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,10240,0.031540266672770184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,8192,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,7168,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,6144,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,5120,0.024235733350118003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,4096,0.021297067403793335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,3584,0.021022933721542358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,3072,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,2560,0.018569600582122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,2048,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,1536,0.017679999272028603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,1024,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,512,0.016658133268356322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3584,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,16384,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,65536,0.08427519798278808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,8192,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,7168,0.027514666318893433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,10240,0.03140053351720174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,6144,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,4096,0.02300693392753601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,2560,0.019113600254058838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,2048,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,1024,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,64,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,3072,32,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,16384,0.038024532794952395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,12288,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,65536,0.07877973715464273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,8192,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,7168,0.02730773289998372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,6144,0.024984532594680788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,5120,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,4096,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,3584,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,3072,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,2560,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,2048,0.018979199727376304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,1536,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,512,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,16384,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,65536,0.07147520383199056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,12288,0.03317653338114421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,8192,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,7168,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,6144,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,4096,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,2048,0.01884053349494934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,64,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2048,32,0.016593066851298015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,65536,0.065774933497111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,16384,0.036931200822194414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,12288,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,6144,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,4096,0.020754132668177286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,3584,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,2560,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,2048,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,1536,0.017204266786575318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,1024,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,256,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1536,32,0.01648853321870168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,16384,0.034747731685638425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,65536,0.05761706829071045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,12288,0.030446932713190718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,10240,0.027989333868026732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,8192,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,7168,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,6144,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,5120,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,4096,0.02368853290875753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,3584,0.020278400182723998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,3072,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,2560,0.01863573392232259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,1536,0.017131733894348144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,1024,0.018091734250386557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,256,0.016109866897265117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,128,0.016497066617012023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,65536,0.05836799939473471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,16384,0.03283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,6144,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,5120,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,2560,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,2048,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,1024,0.01699626644452413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,65536,0.053179732958475744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,16384,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,12288,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,8192,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,6144,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,3072,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,2560,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,1536,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,1024,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,65536,0.048706134160359696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,16384,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,12288,0.027374933163324993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,10240,0.026899200677871705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,4096,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,3072,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,2560,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,1536,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,1024,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,768,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,64,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,65536,0.04741119941075643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,16384,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,6144,1536,0.01972800095876058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,12288,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,10240,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,8192,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,7168,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,5120,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,6144,0.02334933280944824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,3072,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,2560,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,2048,0.0185973326365153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,1536,0.017885865767796834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,512,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,64,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,128,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,65536,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,16384,0.028602667649586994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,12288,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,3072,0.019798400004704793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,768,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,65536,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,16384,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,12288,0.026213334004084272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,8192,0.02443839907646179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,7168,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,4096,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,3584,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,3072,0.019385600090026857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,2560,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,2048,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,1536,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,1024,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,2560,10240,0.030718932549158733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,32,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,16384,0.2154154618581136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,12288,0.1657514731089274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,10240,0.1416533311208089
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,8192,0.11892159779866536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,7168,0.10547306537628173
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,6144,0.09294613202412924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,5120,0.08178559939066568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,4096,0.06987093289693197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,3584,0.06242986520131429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,3072,0.05601173241933187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,2560,0.05034666856129964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,1536,0.03850239912668864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,2048,0.043281066417694095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,1024,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,768,0.027236266930898027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,512,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,256,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,128,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,32,0.023139200607935586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,65536,64,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,16384,0.07509333292643229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,65536,0.2433717409769694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,12288,0.06143893400828043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,10240,0.05379413366317749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,8192,0.04686506589253743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,7168,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,6144,0.037273601690928145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,5120,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,4096,0.029285333553949994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,3584,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,2560,0.025051732858022053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,3072,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,2048,0.02430293361345927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,1536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,1024,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,512,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,128,0.01679253379503886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,16384,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,16384,0.06133759816487631
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,65536,0.1913856029510498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,12288,0.051064534982045495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,10240,0.045670398076375324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,8192,0.039937067031860354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,7168,0.035225598017374675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,5120,0.02983040014902751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,6144,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,4096,0.027988266944885255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,3584,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,3072,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,2560,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,2048,0.023487999041875204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,1536,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,512,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,768,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,64,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,768,12288,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,12288,32,0.017145599921544394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,16384,0.05468266805013021
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,12288,0.046078932285308835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,65536,0.15305387179056804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,10240,0.04123306671778361
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,7168,0.03276906609535217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,8192,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,6144,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,5120,0.027513599395751952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,4096,0.02614186604817708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,3584,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,3072,0.024577067295710246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,1536,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,2048,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,768,0.01775146722793579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,1024,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,256,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,10240,32,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,16384,0.049459199110666915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,12288,0.04211733341217041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,65536,0.1321301301320394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,8192,0.03317653338114421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,10240,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,7168,0.03051626682281494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,6144,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,4096,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,3584,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,2560,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,2048,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,768,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,1024,0.017889066537221273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,8192,32,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,16384,0.04430506626764934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,12288,0.03809279998143514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,65536,0.1349290688832601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,10240,0.034405334790547686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,8192,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,7168,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,6144,0.026761599381764728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,5120,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,3584,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,3072,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,4096,0.024370133876800537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,2048,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,1536,0.018225065867106118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,1024,0.017819732427597046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,32,0.017132800817489625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,7168,64,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,16384,0.0425983985265096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,65536,0.10912533601125081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,12288,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,10240,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,8192,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,7168,0.028602667649586994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,6144,0.026897066831588747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,4096,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,3584,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,3072,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,2048,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,2560,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,1024,0.01781866749127706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,512,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,128,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,16384,0.04546240170796712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,65536,0.09735039869944254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,10240,0.03174293239911397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,7168,0.026897066831588747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,8192,0.028742400805155437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,3072,0.018977065881093345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,2560,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,2048,0.018567466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,1536,0.017410133282343546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,768,0.016862932840983072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,1024,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,256,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,16384,0.040072532494862874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,12288,0.032849067449569704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,65536,0.08983893394470215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,10240,0.029762132962544756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,8192,0.027715200185775758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,7168,0.026554665962855023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,5120,0.024370133876800537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,6144,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,3584,0.021707733472188316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,3072,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,4096,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,2560,0.01877546707789103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,1536,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,1024,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,65536,0.08256746927897135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,16384,0.03843413194020589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,12288,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,8192,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,10240,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,7168,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,6144,0.025259733200073242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,5120,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,4096,0.020820266008377074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,3584,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,3072,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,2048,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,2560,0.018569600582122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,1024,0.01720213294029236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,256,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,16384,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,12288,0.031196800867716472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,65536,0.07598293622334798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,10240,0.029419734080632524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,7168,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,6144,0.024577067295710246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,5120,0.02136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,4096,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,3072,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,2560,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,1024,0.017267199357350667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,160,64,6144,0.02423680027325948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,64,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,3072,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,65536,0.07191999753316244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,10240,0.031405866146087646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,12288,0.03269760012626648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,6144,0.0228000005086263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,5120,0.022256000836690267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,4096,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,3584,0.02027626633644104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,3072,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,2560,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,1024,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,128,0.016246400276819863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,16384,0.03358506759007772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,65536,0.06355413198471069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,7168,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,8192,0.02587413390477498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,6144,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,5120,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,4096,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,3072,0.018637865781784058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,2048,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,2560,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,1024,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,256,0.016658133268356322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,64,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,128,0.015220266580581666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,16384,0.030923734108606975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,65536,0.05761706829071045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,12288,0.029422932863235475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,10240,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,8192,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,7168,0.022936532894770302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,5120,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,2560,0.018637865781784058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,128,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1536,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,16384,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,65536,0.0501749316851298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,12288,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,8192,0.024918399254480996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,7168,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,5120,0.021708800395329794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,4096,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,3584,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,1024,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,1024,32,0.014811733365058899
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,65536,0.04775360027949015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,16384,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,12288,0.02696640094121297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,8192,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,7168,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,5120,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,4096,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,3584,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,1536,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,2048,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,1024,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,256,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,128,0.016658133268356322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,768,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,65536,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,16384,0.027989333868026732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,10240,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,7168,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,3584,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,2048,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,512,0.01693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,65536,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,16384,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,12288,0.025617067019144697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,10240,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,7168,0.024029866854349772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,6144,0.02259413401285807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,5120,0.022116265694300332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,4096,0.020888533194859824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,3584,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,2560,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,2048,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,128,0.015291733543078103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,256,32,0.015289599696795145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,65536,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,16384,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,10240,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,8192,0.02355413238207499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,7168,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,5120,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,4096,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,3584,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,3072,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,2560,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,2048,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,1536,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,256,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,128,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,128,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,65536,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,16384,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,12288,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,10240,0.023963733514149984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,7168,0.022731733322143555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,5120,0.0217738668123881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,4096,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,3584,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,2560,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,1536,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,512,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,128,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,64,32,0.014405333002408347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,65536,0.038024532794952395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,16384,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,10240,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,8192,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2560,7168,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,7168,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,4096,0.021844265858332317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,5120,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,3584,0.020071466763814293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,2048,0.017953066031138103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,1536,0.018091734250386557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,128,0.016426666577657064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,32,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,12288,0.16377280553181967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,16384,0.21078079541524253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,2048,512,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,10240,0.12742079893747965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,8192,0.10724799633026123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,7168,0.09533440272013347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,6144,0.08530240058898926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,4096,0.06492053270339966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,5120,0.07434346675872802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,3584,0.05785813331604004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,3072,0.05270293156305948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,2560,0.04713813463846843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,2048,0.041915734608968094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,1536,0.0351583997408549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,1024,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,768,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,512,0.02409706711769104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,256,0.022051199277242025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,65536,32,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,16384,0.06720960140228271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,12288,0.05522773265838623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,65536,0.21562132835388184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,10240,0.049582934379577635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,8192,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,6144,0.03597653309504191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,7168,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,5120,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,4096,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,3072,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,2048,0.024235733350118003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,1536,0.021505065759023032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,768,0.01761173407236735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,16384,0.06055253346761068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,65536,0.16923306783040365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,12288,0.04908373355865479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,10240,0.045057066281636554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,8192,0.03870613177617391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,7168,0.03515626589457194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,6144,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,5120,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,4096,0.02744213342666626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,3072,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,2048,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,2560,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,1536,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,768,0.01788160006205241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,512,0.017475199699401856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,12288,32,0.01717546582221985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,12288,0.04532800118128459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,16384,0.05348693529764811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,65536,0.15694506963094074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,10240,0.04082346757253011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,8192,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,7168,0.031470932563145954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,6144,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,4096,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,5120,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,3584,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,3072,0.024165334304173787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,2560,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,2048,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,1536,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,512,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,64,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,10240,32,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,16384,0.04768426815668742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,12288,0.04041386842727661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,65536,0.1316864013671875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,10240,0.03563520113627116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,8192,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,7168,0.029764266808827718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,6144,0.027373866240183516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,3584,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,128,512,4096,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,2560,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,2048,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,1536,0.017885865767796834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,1024,0.017409066359202065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,768,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,16384,0.045875199635823566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,10240,0.03440746863683065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,65536,0.11738453706105549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,8192,0.030857600768407184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,7168,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,6144,0.026898133754730224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,5120,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,4096,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,3072,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,3584,0.02389226754506429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,2048,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,1024,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,1536,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,768,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,128,0.016477866967519125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,64,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,16384,0.04485119978586833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,65536,0.10441386699676514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,12288,0.03563520113627116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,10240,0.03283519943555196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,8192,0.02996586759885152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,5120,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,7168,0.028193066517512005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,6144,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,4096,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,3072,0.02211839954058329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,3584,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,1024,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,128,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,6144,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,65536,0.09704106648763021
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,16384,0.04355306625366211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,12288,0.03283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,8192,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,10240,0.02990079919497172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,7168,0.02683093349138896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,6144,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,5120,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,3584,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,2560,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,1536,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,2048,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,1024,0.018092799186706542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,128,0.015703466534614564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,32,0.016732800006866454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,16384,0.039389868577321366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,65536,0.08461653391520182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,12288,0.0339957316716512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,10240,0.028943999608357744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,7168,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,5120,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,3072,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,2048,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,1536,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,1024,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,256,0.017340799172719322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,128,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,4096,32,0.016501333316167197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,12288,0.03461120128631592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,65536,0.07707306543986002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,16384,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,7168,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,6144,0.025942399104436235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,5120,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,4096,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,3584,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,1536,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,1024,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,512,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,256,0.016587733229001363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3584,32,0.016858667135238647
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,12288,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,65536,0.07202133337656656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,16384,0.034270934263865155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,10240,0.02839999993642171
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,8192,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,7168,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,6144,0.02450559933980306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,5120,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,4096,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,3584,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,3072,0.01884373426437378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,2048,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,2560,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,1536,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,1024,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,128,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,3072,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,12288,0.02996693253517151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,16384,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,65536,0.06717440287272135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,10240,0.027988266944885255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,8192,0.02546773354212443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,6144,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,5120,0.02116159995396932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,4096,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,3584,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,1536,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,1024,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,128,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2560,32,0.0164874662955602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,12288,0.03065173427263896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,16384,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,65536,0.06048426628112793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,10240,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,7168,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,8192,0.026897066831588747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,6144,0.0228000005086263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,5120,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,3584,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,2048,0.01843093236287435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,2560,0.018294399976730345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,1024,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,256,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,128,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,64,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,2048,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,16384,0.03126613299051921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,12288,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,65536,0.05529599984486898
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,8192,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,10240,0.02696320017178853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,6144,0.02218773365020752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,3584,0.01986773411432902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,4096,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,2048,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,1536,0.01665493349234263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,1024,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,32,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,16384,0.029556266466776532
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,65536,0.05150613387425741
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,12288,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,8192,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,7168,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,6144,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,3072,0.019385600090026857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,1536,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,512,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,128,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,16384,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,65536,0.04635200103123983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,12288,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,10240,0.026625066995620728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,7168,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,6144,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,3584,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,2048,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,1024,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,768,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,512,0.015768532951672874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,256,0.016566399733225504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,128,0.015359999736150107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,32,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,768,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,16384,0.02826346755027771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,65536,0.042055467764536544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,8192,0.022662399212519328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,7168,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,6144,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,5120,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,3584,0.01877546707789103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,4096,0.019115734100341796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,2048,0.017547732591629027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,1024,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,512,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,65536,0.040550398826599124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,16384,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,8192,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,5120,0.021708800395329794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,4096,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,3584,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,2048,0.017816533644994102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,2560,0.018228266636530557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,1024,0.01665493349234263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,128,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,65536,0.03734079996744792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,16384,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,12288,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,8192,0.02300800085067749
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,6144,0.02225066622098287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,5120,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,3584,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,2048,0.017885865767796834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,512,0.015359999736150107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,256,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,128,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,65536,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,16384,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,12288,0.024099200963974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,6144,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,5120,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,3584,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,4096,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,2048,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,128,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,32,0.015270400047302245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,65536,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,16384,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,12288,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,8192,0.02245866656303406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,10240,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,7168,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,6144,0.02232426603635152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,5120,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,3584,0.01884053349494934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,512,0.01576959987481435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,256,0.016179200013478598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,128,0.014405333002408347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,32,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,16384,0.20469759305318197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,12288,0.15872000058492025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,10240,0.12773653666178386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,7168,0.09448106288909912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,8192,0.10734933217366535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,6144,0.08388906319936117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,4096,0.06376106739044189
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,5120,0.07383039792378744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,3584,0.057036801179250085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,2560,0.04689600070317586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,3072,0.052293332417805996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,96,7168,12288,0.038365864753723146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,2048,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,1536,0.0360479990641276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,1024,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,768,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,512,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,256,0.021505065759023032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,128,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,64,0.021095466613769532
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,65536,32,0.021572266022364298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,16384,0.06365866661071777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,12288,0.053452801704406736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,65536,0.21555306116739908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,10240,0.04713706572850545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,7168,0.03890026807785034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,8192,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,6144,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,4096,0.02904213269551595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,5120,0.031061333417892457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,3072,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,1536,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,1024,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,768,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,128,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,64,0.017757866779963175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,16384,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,16384,0.059631999333699545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,12288,0.04922026793162028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,10240,0.043212799231211345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,65536,0.16950613657633465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,8192,0.03836479981740316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,7168,0.03604480028152466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,6144,0.032153600454330446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,4096,0.02757866581281026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,3584,0.026782933870951337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,5120,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,3072,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,2560,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,2048,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,1024,0.018228266636530557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,1536,0.020205867290496827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,768,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,512,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,64,0.017065600554148356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,12288,32,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,12288,0.044100264708201095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,10240,0.04034666617711385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,16384,0.05259946584701538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,65536,0.15380373001098632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,8192,0.034679468472798666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,7168,0.033111466964085894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,5120,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,4096,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,3584,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,3072,0.023756800095240276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,1536,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,1024,0.01843093236287435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,10240,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,16384,0.04532800118128459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,65536,0.12960426807403563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,12288,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,10240,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,8192,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,6144,0.027784534295399982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,7168,0.029901866118113202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,5120,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,3584,0.02368853290875753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,3072,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,4096,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,2048,0.019386667013168334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,1536,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,1024,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,8192,32,0.016638933618863424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,12288,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,65536,0.11223039627075196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,16384,0.04450986782709758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,8192,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,7168,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,6144,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,5120,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,4096,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,3072,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,2560,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,1536,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,1024,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,768,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,256,0.016177067160606386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,128,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,16384,0.04403520027796427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,65536,0.09797546863555909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,12288,0.03481920162836711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,10240,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,8192,0.02887786626815796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,7168,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,5120,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,4096,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,3584,0.023075199127197264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,2048,0.0197269340356191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,2560,0.021434666713078816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,1024,0.01692906618118286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,128,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,64,0.01604373355706533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,12288,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,65536,0.09099946816762289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,16384,0.040958933035532635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,10240,0.032085333267847696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,8192,0.027512532472610474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,6144,0.02662293314933777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,3072,0.020754132668177286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,2048,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,1536,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,1024,0.01761066714922587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,64,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,128,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,12288,0.0336575984954834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,16384,0.037887998421986896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,65536,0.07956480185190837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,10240,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,8192,0.026283733050028485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,6144,0.02430400053660075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,5120,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,3584,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,2560,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,768,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,256,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,128,0.015837867061297098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,16384,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,65536,0.0717141310373942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,12288,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,10240,0.03276693423589071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,8192,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,7168,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,6144,0.02430293361345927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,5120,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,3584,0.018637865781784058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,2048,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,2560,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,1536,0.016450132926305136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,512,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,256,0.01576959987481435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,128,0.015225600202878317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3584,32,0.015224533279736838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,65536,0.06744639873504639
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,16384,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,12288,0.02969599962234497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,10240,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,6144,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,7168,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,5120,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,3584,0.01883946657180786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,2048,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,64,0.015634133418401083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,3072,32,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,16384,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,65536,0.06140586535135904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,12288,0.02935466567675273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,10240,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,8192,0.02499306599299113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,7168,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,6144,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,5120,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,4096,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,2048,0.016659200191497803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,1536,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,256,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,128,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,65536,0.05744640032450358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,16384,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,10240,0.027034666140874224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,8192,0.025461333990097045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,7168,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,6144,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,4096,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,5120,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,3584,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,3072,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,2048,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,512,0.015631999572118124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,256,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,128,0.015495466192563376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,2048,32,0.015634133418401083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,65536,0.051336534818013514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,16384,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,12288,0.028058665990829467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,8192,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,6144,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,4096,0.018702934185663857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,3584,0.018706132968266807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,2560,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,2048,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,768,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,256,0.015837867061297098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1536,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,65536,0.048468267917633055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,12288,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,7168,0.022529067595799764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,3584,0.018844799200693766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,3072,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,2560,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,2048,0.01795519987742106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,1536,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,256,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,64,0.015291733543078103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,65536,0.042871467272440594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,16384,0.03031040032704671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,10240,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,12288,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,7168,0.022117332617441813
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,6144,0.020682666699091592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,5120,0.020426666736602782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,4096,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,3584,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,2560,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,2048,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,256,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,64,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,65536,0.03986666599909465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,16384,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,8192,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,6144,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,7168,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,5120,0.02034453352292379
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,4096,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,3584,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,2048,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,1536,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,128,0.01597546637058258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,512,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,65536,0.03877653280893962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,16384,0.025803732872009277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,12288,0.024848000208536784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,8192,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,6144,0.02211839954058329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,5120,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,2048,0.01781866749127706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,2560,0.01781546672185262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,7168,10240,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,256,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,64,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,256,32,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,65536,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,16384,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,10240,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,8192,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,5120,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,6144,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,4096,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,3072,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,512,0.014938666423161825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,64,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,128,32,0.014405333002408347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,65536,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,16384,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,12288,0.022938666741053264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,8192,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,5120,0.02198186715443929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,7168,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,3584,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,4096,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,2048,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,768,0.016179200013478598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,256,0.016587733229001363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,512,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,128,0.014406399925549826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,64,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,65536,0.03413333495457967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,16384,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,10240,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,12288,0.022662399212519328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,7168,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,6144,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,5120,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,4096,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,2560,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,2048,0.018478933970133463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,1536,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,512,0.015836800138155617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,128,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,64,0.014745600024859109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,32,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,80,4096,2048,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,16384,0.20319786071777343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,12288,0.15482880274454752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,8192,0.11119786898295085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,10240,0.13219733238220216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,7168,0.0991925319035848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,6144,0.08683306376139323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,5120,0.07751359939575195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,4096,0.06966613133748373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,3584,0.06079146862030029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,2560,0.048913065592447916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,3072,0.05438506603240967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,2048,0.043622398376464845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,1536,0.037137067317962645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,1024,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,768,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,256,0.018910932540893554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,512,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,128,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,64,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,65536,32,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,16384,0.06331733465194703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,12288,0.05157333215077718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,10240,0.04676266511281331
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,8192,0.040003200372060135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,7168,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,65536,0.21484266916910805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,6144,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,5120,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,4096,0.027716267108917236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,3584,0.02648746569951375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,3072,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,2560,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,768,0.017683200041453042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,256,0.016497066617012023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,64,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,16384,32,0.017988266547520955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,16384,0.053384534517923986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,10240,0.040209066867828366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,12288,0.04491946697235107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,65536,0.1619274616241455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,8192,0.03529493411382039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,7168,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,6144,0.03072106639544169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,3584,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,2560,0.023959465821584067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,3072,0.02368853290875753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,1536,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,512,0.017522132396697997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,12288,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,16384,0.04799253145853678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,12288,0.04163946708043416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,65536,0.14885759353637695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,10240,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,8192,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,7168,0.03089173237482707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,6144,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,4096,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,5120,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,3584,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,3072,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,2048,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,1024,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,768,0.017386666933695474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,128,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,256,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,32,0.01683093309402466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,10240,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,12288,0.03659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,10240,0.03297066688537598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,16384,0.04171200195948283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,65536,0.1240063985188802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,8192,0.02956053415934245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,7168,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,6144,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,5120,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,3584,0.023277866840362548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,4096,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,2560,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,1536,0.01836479902267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,2048,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,768,0.01672640045483907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,256,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,128,0.01644373337427775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,32,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,16384,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,65536,0.10919253031412761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,12288,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,10240,0.03126613299051921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,8192,0.028522666295369464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,7168,0.02723840077718099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,6144,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,4096,0.02300693392753601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,3072,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,1024,0.017338667313257852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,2560,0.018567466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,768,0.017409066359202065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,65536,0.09410560131072998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,16384,0.04307733376820882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,12288,0.037546666463216145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,10240,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,8192,0.027646932999293012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,5120,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,6144,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,7168,0.02573546568552653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,3584,0.02109653353691101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,4096,0.02143359978993734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,1536,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,128,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,6144,64,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,16384,0.03945706685384114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,65536,0.08683413664499919
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,12288,0.0348853349685669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,8192,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,10240,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,7168,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,6144,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,5120,0.022733867168426514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,4096,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,3072,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,1536,0.01700053413709005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,2048,0.018092799186706542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,256,0.016385066509246825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,128,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,16384,0.03461120128631592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,65536,0.07481813430786133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,10240,0.028124799331029255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,12288,0.02922133406003316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,8192,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,7168,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,6144,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,5120,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,4096,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,3072,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,3584,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,2048,0.0169322669506073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,1024,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,256,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,512,0.01604373355706533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,64,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,4096,32,0.015220266580581666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,16384,0.03413333495457967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,65536,0.06840319633483886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,8192,0.025259733200073242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,7168,0.023619200785954794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,4096,0.0192522664864858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,5120,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,3072,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,2560,0.017678932348887125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,2048,0.01679146687189738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,1536,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,256,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,128,0.01644159952799479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,16384,0.03385813236236572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,65536,0.06502399841944376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,10240,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,7168,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,6144,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,4096,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,3072,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,3584,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,2560,0.017748266458511353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,2048,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3072,32,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,65536,0.05850559870402018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,16384,0.03290346662203471
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,10240,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,12288,0.029422932863235475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,7168,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,6144,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,5120,0.020412800709406535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,4096,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,2048,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,2560,0.017273600896199545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2560,32,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,65536,0.051268267631530764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,16384,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,12288,0.028601600726445513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,10240,0.025602134068806966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,7168,0.02157013416290283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,5120,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,3072,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,2560,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,2048,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,512,0.016454399625460307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,2048,32,0.015155200163523355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,65536,0.04829866488774617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,12288,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,8192,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,7168,0.02177493373552958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,5120,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,3072,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,2560,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,2048,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,64,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1536,32,0.015358933806419372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,16384,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,65536,0.04171093304951985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,12288,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,10240,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,7168,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,6144,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,5120,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,4096,0.018569600582122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,3584,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,2048,0.01658560037612915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,2560,0.016794667641321818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,768,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,512,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,128,0.015224533279736838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,1024,32,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,65536,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,16384,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,12288,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,10240,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,6144,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,5120,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,2560,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,2048,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,256,0.015292800466219583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,64,0.015631999572118124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,768,32,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,16384,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,65536,0.036933334668477376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,12288,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,10240,0.023481599489847817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,6144,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,5120,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,2560,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,2048,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,768,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,512,32,0.015155200163523355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,65536,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,16384,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,10240,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,12288,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,8192,0.022296533981959025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,7168,0.02116480072339376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,6144,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,5120,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,3584,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,2048,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,2560,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,768,0.015359999736150107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,256,32,0.014403200149536133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,65536,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,12288,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,16384,0.02368746598561605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,10240,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,7168,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,5120,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,4096,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,3584,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,3072,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,1024,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,768,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,256,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,128,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,128,64,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,65536,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,16384,0.02362026572227478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,12288,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,10240,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,8192,0.020682666699091592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,7168,0.020820266008377074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,5120,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,4096,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,3584,0.018637865781784058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,2560,0.018023467063903807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,2048,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,5120,1024,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,512,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,64,64,0.015631999572118124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,65536,0.030037333567937214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,16384,0.024370133876800537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,10240,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,12288,0.02198186715443929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,8192,0.021229867140452066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,6144,0.020614399512608846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,3584,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,2560,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,2048,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,1024,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,256,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,128,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,32,32,0.015474133690198264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,64,3584,10240,0.027784534295399982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,16384,0.20421973864237467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,12288,0.15783252716064453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,10240,0.13284266789754232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,8192,0.11100052992502848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,7168,0.09857707023620606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,6144,0.08714026610056559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,5120,0.07553706963857015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,4096,0.06905173460642497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,3584,0.05857280095418295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,3072,0.05304319858551025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,1536,0.03652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,2560,0.0478549321492513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,1024,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,768,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,256,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,512,0.02286720077196757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,128,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,64,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,32,0.020553600788116456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,16384,0.06116799910863241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,12288,0.05034773349761963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,65536,0.21220693588256836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,10240,0.04464639822642009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,8192,0.039049601554870604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,7168,0.036999468008677164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,6144,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,4096,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,5120,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,3584,0.02614293297131856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,3072,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,2560,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,1536,0.021943465868632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,1024,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,512,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,128,0.015498666961987814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,16384,32,0.016385066509246825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,16384,0.054681599140167236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,12288,0.04471466541290283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,65536,0.16233493487040201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,10240,0.040484265486399336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,8192,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,6144,0.03140373428662618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,5120,0.028809599081675213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,7168,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,4096,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,3584,0.02532373269399007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,3072,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,2560,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,2048,0.021846399704615275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,1536,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,768,0.017205333709716795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,12288,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,16384,0.04686506589253743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,65536,0.14834346771240234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,12288,0.03911786476771037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,10240,0.03659093379974365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,8192,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,6144,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,7168,0.029014400641123456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,5120,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,3584,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,2560,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,1536,0.017887999614079796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,1024,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,128,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,64,0.016581333676973977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,10240,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,16384,0.043281066417694095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,65536,0.12110293706258138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,12288,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,10240,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,8192,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,7168,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,6144,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,5120,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,3584,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,3072,0.021708800395329794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,2560,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,2048,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,1536,0.01665600041548411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,1024,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,768,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,512,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,64,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,128,0.01556373337904612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,12288,0.03365653355916341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,16384,0.04403306643168132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,65536,0.10455146630605061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,10240,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,7168,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,8192,0.02723840077718099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,6144,0.024848000208536784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,5120,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,3584,0.022663466135660806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,3072,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,2048,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,2560,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,1536,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,1024,0.01665600041548411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,768,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,256,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,128,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,64,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,7168,32,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,16384,0.040209066867828366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,12288,0.03543039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,65536,0.09413973490397134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,8192,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,10240,0.030855466922124226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,6144,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,5120,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,3584,0.022529067595799764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,2048,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,1024,0.016586666305859886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,6144,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,65536,0.08796266714731851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,16384,0.037275731563568115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,12288,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,10240,0.030923734108606975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,7168,0.025259733200073242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,5120,0.023484800259272257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,6144,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,4096,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,1536,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,2048,0.017338667313257852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,512,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,128,0.01618026693662008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,65536,0.0748533328374227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,16384,0.03406613270441691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,12288,0.030723200241724653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,8192,0.02471359968185425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,7168,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,5120,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,6144,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,4096,0.020482132832209267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,3584,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,2048,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,2560,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,4096,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,65536,0.0688810666402181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,12288,0.030446932713190718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,16384,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,10240,0.026554665962855023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,7168,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,6144,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,5120,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,4096,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,3584,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,2048,0.018157867590586345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,2560,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,1536,0.01665600041548411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,512,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,64,0.015291733543078103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,128,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3584,32,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,65536,0.061713067690531406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,16384,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,12288,0.028534400463104247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,10240,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,7168,0.02368853290875753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,5120,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,4096,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,2560,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,2048,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,1536,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,256,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,3072,32,0.016065067052841185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,65536,0.05819733142852783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,12288,0.027376000086466474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,16384,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,10240,0.02648853262265523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,7168,0.023143466313680014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,5120,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,4096,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,2560,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,1536,0.016658133268356322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,2048,0.016794667641321818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,128,0.01495039959748586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2560,32,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,65536,0.05324800014495849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,12288,0.027170133590698243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,16384,0.029627732435862225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,10240,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,8192,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,7168,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,5120,0.02006933291753133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,4096,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,1536,0.016587733229001363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,2048,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,2560,0.017270400126775106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,512,0.016179200013478598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,256,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,2048,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,65536,0.04730879863103231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,12288,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,16384,0.027988266944885255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,10240,0.024781866868336996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,8192,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,7168,0.020958934227625528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,5120,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,2560,0.017204266786575318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,2048,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,768,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,512,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,256,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1536,32,0.015702399611473083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,65536,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,12288,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,16384,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,10240,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,5120,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,4096,0.018771199385325114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,2560,0.01720106601715088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,1536,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,2048,0.01679253379503886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,512,0.01576959987481435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,128,0.016314666469891867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,65536,0.03870720068613688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,16384,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,12288,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,8192,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,6144,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,5120,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,2560,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,2048,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,1024,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,512,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,256,0.015359999736150107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,768,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,65536,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,16384,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,10240,0.022795732816060385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,12288,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,8192,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,6144,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,2048,0.017886932690938315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,2560,0.0173418660958608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,1536,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,256,0.01590506633122762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,128,0.016039466857910155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,65536,2048,0.04280426502227783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,64,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,65536,0.03652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,16384,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,12288,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,7168,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,8192,0.02095680038134257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,6144,0.02116159995396932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,4096,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,3584,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,2048,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,2560,0.01700053413709005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,1024,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,512,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,256,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,128,0.016428800423940022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,64,0.015086932977040609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,256,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,65536,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,12288,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,16384,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,10240,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,8192,0.021504000822703043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,5120,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,3584,0.017953066031138103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,2560,0.017340799172719322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,256,0.01576746702194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,128,32,0.014459733168284097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,65536,0.031129600604375203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,16384,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,12288,0.021092265844345093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,10240,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,8192,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,6144,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,3072,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,2560,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,2048,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,512,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,128,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,64,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,65536,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,12288,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,16384,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,8192,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,7168,0.021025067567825316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,6144,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,5120,0.020546134312947592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,4096,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,3072,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,2560,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,2048,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,1536,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,256,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,32,32,0.01638826628526052
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,16384,0.20107946395874024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,12288,0.15455573399861652
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,10240,0.12919572989145917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,8192,0.10943146546681722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,7168,0.0963594675064087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,6144,0.08417387008666992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,5120,0.0736255963643392
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,4096,0.06481920083363851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,3584,0.056524801254272464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,3072,0.05147306521733602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,2560,0.04645546674728394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,2048,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,1536,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,768,0.024848000208536784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,1024,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,512,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,256,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,65536,32,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,16384,0.05894826650619507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,65536,0.2035370667775472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,12288,0.04901440143585205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,8192,0.03864213228225708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,10240,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,7168,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,6144,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,5120,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,4096,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,2560,0.024029866854349772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,3072,0.024641066789627075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,2048,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,16384,0.05550080140431722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,65536,0.1540778636932373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,12288,0.04693333307902019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,10240,0.043825066089630126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,7168,0.03263253370920817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,8192,0.03338239987691243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,6144,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,5120,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,3584,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,3072,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,2048,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,1536,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,768,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,256,0.016775466998418174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,128,0.015837867061297098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,64,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,12288,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,65536,0.1411754608154297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,16384,0.0527018666267395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,12288,0.043486932913462326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,10240,0.03583999872207642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,8192,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,7168,0.029421865940093994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,6144,0.028602667649586994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,4096,0.026349866390228273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,3584,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,2560,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,2048,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,1536,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,1024,0.01772800087928772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,768,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,64,0.01576959987481435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,10240,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,16384,0.0409610668818156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,65536,0.11175466378529866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,12288,0.0343392014503479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,8192,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,6144,0.02648640076319377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,3584,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,3072,0.021934932470321654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,2560,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,1536,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,2048,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,1024,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,768,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,16384,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,65536,0.09963520367940268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,12288,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,10240,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,8192,0.026895999908447266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,6144,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,7168,0.025803732872009277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,5120,0.02430400053660075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,4096,0.02218773365020752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,3072,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,2560,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,2048,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,1536,0.017409066359202065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,768,0.016454399625460307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,128,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,65536,0.08823359807332357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,12288,0.03440746863683065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,10240,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,8192,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,6144,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,5120,0.023075199127197264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,4096,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,3584,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,3072,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,2560,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,1536,0.01836479902267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,2048,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,1024,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,256,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,6144,64,0.015086932977040609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,16384,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,65536,0.0827392021814982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,10240,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,12288,0.03140053351720174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,8192,0.02567039926846822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,512,5120,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,6144,0.02368853290875753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,5120,0.021504000822703043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,3584,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,1536,0.01761386593182882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,1024,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,128,0.015415466825167336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,64,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,5120,32,0.016754132509231568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,16384,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,12288,0.02874773343404134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,65536,0.06969813505808511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,10240,0.027990400791168213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,8192,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,7168,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,6144,0.02429866592089335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,3584,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,3072,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,2560,0.017272533973058064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,1024,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,4096,32,0.016450132926305136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,65536,0.0639306664466858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,12288,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,16384,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,10240,0.026625066995620728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,8192,0.026215465863545735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,7168,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,5120,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,3072,0.017748266458511353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,2560,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,512,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,128,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3584,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,65536,0.058265598615010586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,48,64,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,12288,0.028328533967336016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,16384,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,10240,0.02614506681760152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,7168,0.023142399390538533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,8192,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,6144,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,5120,0.019594667355219524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,3584,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,4096,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,3072,0.017887999614079796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,2560,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,2048,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,1536,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,256,0.016428800423940022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,32,0.015291733543078103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,3072,64,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,65536,0.055637331803639736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,16384,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,8192,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,10240,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,7168,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,6144,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,3072,0.01686506668726603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,1536,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,512,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,65536,0.04925440152486165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,12288,0.027306665976842243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,16384,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,10240,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,6144,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,5120,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,3072,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,2048,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,512,0.015222400426864624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,256,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,64,0.015848533312479655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2048,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,65536,0.04375893274943034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,16384,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,10240,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,5120,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,3584,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,3072,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,2048,0.017816533644994102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,2560,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,768,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,256,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,128,0.015496533115704855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,64,0.015221333503723145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1536,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,65536,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,12288,0.02430400053660075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,16384,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,10240,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,8192,0.022392533222834268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,7168,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,2560,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,512,0.014881066481272378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,1024,64,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,65536,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,16384,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,12288,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,10240,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,7168,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,5120,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,3584,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,2560,0.01699733336766561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,2048,0.01713599960009257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,768,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,512,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,128,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,768,64,0.015156267086664834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,65536,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,16384,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,12288,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,10240,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,8192,0.02239360014597575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,7168,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,4096,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,3072,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,3584,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,2048,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,2560,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,1536,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,1024,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,768,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,512,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,256,0.016591999928156534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,128,0.015154133240381876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,512,64,0.014814933141072592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,65536,0.032358400026957196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,16384,0.022665599981943764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,12288,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,8192,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,6144,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,5120,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,4096,0.01972800095876058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,3584,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,2560,0.01693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,2048,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,1536,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,65536,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,16384,0.021640533208847047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,12288,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,7168,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,6144,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,5120,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,3584,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,3072,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,2560,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,768,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,512,0.01597653329372406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,256,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,128,0.014882133404413859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,64,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,128,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,16384,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,65536,0.027170133590698243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,12288,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,10240,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,4096,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,3584,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,3072,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,2560,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,128,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,65536,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,16384,0.02129813234011332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,12288,0.021640533208847047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,8192,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,7168,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,5120,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,3584,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,3072,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,2560,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,2048,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,512,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,256,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,128,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,32,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,16384,0.16404693921407063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,12288,0.12810239791870118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,10240,0.11062506834665935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,8192,0.09134079615275065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,7168,0.08219306468963623
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,6144,0.0736255963643392
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,5120,0.06458026568094889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,4096,0.05587519804636637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,3584,0.051336534818013514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,3072,0.04710400104522705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,2560,0.04286933342615763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,2048,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,1536,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,1024,0.02682773272196452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,768,0.02532586654027303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,512,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,256,0.019796266158421835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,128,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,64,0.019113600254058838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,65536,32,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,65536,0.19118080139160157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,16384,0.05847040017445883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,12288,0.04782079855600993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,10240,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,8192,0.03802560170491536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,7168,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,6144,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,5120,0.03031040032704671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,4096,0.027374933163324993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,3584,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,3072,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,2560,0.024167466163635253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,2048,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,1536,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,1024,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,16384,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,65536,0.15045973459879558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,16384,0.05307626724243164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,12288,0.04464639822642009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,10240,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,8192,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,2560,64,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,7168,0.034815998872121175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,6144,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,4096,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,3584,0.024685867627461753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,2560,0.0230730672677358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,3072,0.02409706711769104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,2048,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,1536,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,1024,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,768,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,12288,32,0.017106133699417114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,16384,0.04723946650822957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,65536,0.13298346996307372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,12288,0.0413696010907491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,10240,0.03809279998143514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,8192,0.034134399890899655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,7168,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,6144,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,5120,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,4096,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,3584,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,3072,0.023209599653879802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,2560,0.022835199038187662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,1024,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,768,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,256,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,10240,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,65536,0.10661333401997883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,16384,0.03805013497670491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,12288,0.03399680058161418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,8192,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,5120,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,6144,0.025496532519658405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,3584,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,4096,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,3072,0.02129813234011332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,2048,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,1536,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,512,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,256,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,8192,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,65536,0.09588053226470947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,12288,0.03222186764081319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,10240,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,6144,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,5120,0.023550933599472045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,4096,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,3584,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,2560,0.018772266308466592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,2048,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,1536,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,65536,0.0841386636098226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,16384,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,12288,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,8192,0.026419200499852497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,7168,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,6144,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,5120,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,4096,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,256,512,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,2560,0.018706132968266807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,1536,0.01699840029080709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,128,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,64,0.016476800044377647
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,6144,32,0.014812800288200378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,16384,0.03522666692733765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,65536,0.07949653466542562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,10240,0.02949013312657674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,8192,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,7168,0.022940800587336222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,6144,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,5120,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,2560,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,512,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,32,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,5120,64,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,65536,0.06601599852244058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,16384,0.031129600604375203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,7168,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,5120,0.020958934227625528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,4096,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,3584,0.01761386593182882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,2048,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,768,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,256,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,512,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,128,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,4096,32,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,32,64,256,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,16384,0.02956053415934245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,65536,0.06119893391927084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,8192,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,7168,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,10240,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,5120,0.02032426595687866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,4096,0.01885333259900411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,6144,0.02286613384882609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,3072,0.018547199169794717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,2560,0.018615466356277467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,3584,0.01811306675275167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,2048,0.01656426688035329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,1536,0.016755199432373045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,1024,0.01671253244082133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,768,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,256,0.0165802667538325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,128,0.016531200210253397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,64,0.016448000073432924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3584,32,0.01644480029741923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,65536,0.0549888014793396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,12288,0.02648640076319377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,8192,0.025259733200073242
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,7168,0.023277866840362548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,10240,0.025940267244974773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,6144,0.022516266504923502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,5120,0.019899733861287437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,4096,0.018819200992584228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,3584,0.017940266927083334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,3072,0.018281600872675576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,1536,0.016424533724784852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,1024,0.01640959978103638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,768,0.016671999295552572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,256,0.01646719972292582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,512,0.015401599804560342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,128,0.016463999946912132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,64,0.01656000018119812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,32,0.01486186683177948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,65536,0.051541332403818765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,16384,0.02723840077718099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,12288,0.02600853244463603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,8192,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,10240,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,6144,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,5120,0.018554667631785073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,4096,0.01957226594289144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,3584,0.017666133244832356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,3072,0.018423465887705485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,2560,0.018345600366592406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,2048,0.016643200318018594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,1536,0.016780799627304076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,1024,0.016565333803494772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,512,0.01595093309879303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,256,0.01646613379319509
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,64,0.01648640036582947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,128,0.016436266899108886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2560,32,0.014754133423169455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,65536,0.046830932299296066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,16384,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,12288,0.026898133754730224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,8192,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,7168,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,6144,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,5120,0.01858133276303609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,3072,0.017963733275731406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,2560,0.018481065829594932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,1536,0.016976000865300496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,2048,0.0166293332974116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,1024,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,768,0.016049066185951234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,512,0.016598400473594666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,256,0.015413332978884378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,128,0.016509866714477538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,64,0.01650879979133606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,32,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,16384,0.028537599245707194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,65536,0.04082346757253011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,12288,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,10240,0.024359466632207234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,8192,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,7168,0.020522665977478028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,6144,0.02020906607309977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,4096,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,5120,0.01849386692047119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,3584,0.018487467368443807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,3072,0.01809813380241394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,2560,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,2048,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,1536,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,1024,0.016382933656374613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,768,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,512,0.015225600202878317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1536,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,65536,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,16384,0.025602134068806966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,12288,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,8192,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,6144,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,5120,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,4096,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,3584,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,256,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,64,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,65536,0.03877546787261963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,16384,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,12288,0.021227733294169108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,8192,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,2560,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,1536,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,256,0.014802133043607077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,128,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,768,32,0.01647040049235026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,65536,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,16384,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,10240,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,3584,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,2560,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,1536,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,768,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,512,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,256,0.01495039959748586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,64,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,512,32,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,65536,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,16384,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,8192,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,5120,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,4096,0.020139733950297035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,3584,0.01672640045483907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,2560,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,768,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,512,0.016160000363985697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,256,0.015214932958285013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,256,32,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,65536,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,16384,0.020891733964284263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,12288,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,8192,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,6144,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,5120,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,4096,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,3584,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,3072,0.01836479902267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,2560,0.016521599888801575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,512,0.01604480048020681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,256,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,64,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,128,32,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,65536,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,16384,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,12288,0.019388800859451293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,8192,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,6144,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,5120,0.01918399930000305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,3584,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,3072,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,2560,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,1024,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,512,0.014472533265749613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,256,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,128,0.015634133418401083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,64,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,32,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,65536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,16384,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,12288,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,10240,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,8192,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,7168,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,6144,0.018637865781784058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,5120,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,4096,0.018977065881093345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,3584,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,3072,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,2560,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,1536,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,1024,0.015631999572118124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,768,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,512,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,256,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,128,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,64,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,32,32,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,16384,0.1837056001027425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,12288,0.14629546801249188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,10240,0.10919253031412761
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,8192,0.09052159786224365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,7168,0.08147626717885335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,6144,0.07246507008870443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,5120,0.06324906746546427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,4096,0.05447680155436198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,3584,0.05048319896062216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,3072,0.046011734008789065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,2560,0.04116373459498088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,2048,0.03659093379974365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,1536,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,3072,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,1024,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,768,0.024918399254480996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,512,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,256,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,64,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,65536,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,16384,0.06410239934921265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,65536,0.185208527247111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,12288,0.045602134863535565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,10240,0.04177920023600261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,8192,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,6144,0.0318122665087382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,5120,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,3584,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,3072,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,2560,0.02327893376350403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,2048,0.021028266350428263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,1536,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,768,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,64,0.016179200013478598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,16384,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,2048,4096,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,16384,0.05263359944025675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,65536,0.14560532569885254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,12288,0.043281066417694095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,10240,0.04075733423233032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,8192,0.03577173153559367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,7168,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,6144,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,5120,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,4096,0.024779733022054037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,3584,0.02362026572227478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,2048,0.020888533194859824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,1536,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,1024,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,512,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,256,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,128,0.01644159952799479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,64,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,12288,32,0.016479999820391337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,12288,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,16384,0.046011734008789065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,65536,0.12702186902364093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,10240,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,7168,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,8192,0.0332479993502299
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,5120,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,4096,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,3584,0.023891200621922813
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,3072,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,2560,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,1536,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,768,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,1024,0.01836479902267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,512,0.015552000204722086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,64,0.015837867061297098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,10240,32,0.016450132926305136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,16384,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,12288,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,65536,0.1025696039199829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,10240,0.03003840049107869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,8192,0.026964267094930012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,7168,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,6144,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,5120,0.024372265736262003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,3584,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,4096,0.022938666741053264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,3072,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,2560,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,1536,0.01713386575380961
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,2048,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,768,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,64,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,8192,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,65536,0.0921610673268636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,12288,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,16384,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,10240,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,8192,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,6144,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,5120,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,4096,0.021640533208847047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,3072,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,2560,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,512,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,64,0.016459733247756958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,65536,0.0836949348449707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,12288,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,16384,0.03496640125910441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,10240,0.029626667499542236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,8192,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,7168,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,5120,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,6144,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,4096,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,3584,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,3072,0.018567466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,2560,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,2048,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,768,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,512,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,256,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,6144,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,65536,0.07471786340077718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,16384,0.033928533395131424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,12288,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,10240,0.027508266766866046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,7168,0.023962666591008507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,8192,0.024771199623743693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,5120,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,6144,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,3584,0.02034239967664083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,2560,0.01699733336766561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,2048,0.01781546672185262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,512,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,64,0.01576959987481435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,5120,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,65536,0.06212160189946493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,16384,0.029764266808827718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,7168,0.025051732858022053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,8192,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,6144,0.023484800259272257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,5120,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,4096,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,3072,0.0198634664217631
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,3584,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,2048,0.018526933590571084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,1536,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,768,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,1024,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,512,0.015277866522471109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,64,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,128,0.01648319959640503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,4096,32,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,65536,0.05645653406778971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,12288,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,10240,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,8192,0.024779733022054037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,6144,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,5120,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,3072,0.019795199235280357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,1536,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,512,0.015154133240381876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,64,0.015836800138155617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,256,0.016179200013478598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3584,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,65536,0.05130240122477213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,16384,0.027989333868026732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,12288,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,16,64,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,8192,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,6144,0.021707733472188316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,5120,0.02259413401285807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,4096,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,3072,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,2560,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,1536,0.017338667313257852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,512,0.01647040049235026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,256,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,64,0.016948266824086507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,3072,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,12288,0.02553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,65536,0.04829866488774617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,16384,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,8192,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,6144,0.02102400064468384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,4096,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,3584,0.019773866732915243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,3072,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,256,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,128,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,64,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,16384,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,65536,0.04341760079065959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,10240,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,8192,0.021501866976420085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,6144,0.02027626633644104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,5120,0.020205867290496827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,3584,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,2560,0.01854506731033325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,3072,0.018567466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,1536,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,1024,0.016838399569193523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,768,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,512,0.015496533115704855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,128,0.01644373337427775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,32,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,65536,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,16384,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,12288,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,8192,0.021436800559361778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,6144,0.019591466585795084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,4096,0.019796266158421835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,3584,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,3072,0.017679999272028603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,2560,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,2048,0.017272533973058064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,1024,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,512,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,768,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,128,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,32,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,65536,0.03304106593132019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,16384,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,8192,0.020823466777801513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,7168,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,3584,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,3072,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,1024,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,512,0.014936533570289613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,256,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1024,64,0.015224533279736838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,65536,0.036111998558044436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,16384,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,6144,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,4096,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,2560,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,1536,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,2048,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,1024,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,512,0.014816000064214071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,64,0.014816000064214071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,768,32,0.015768532951672874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,65536,0.03146986762682597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,16384,0.021911466121673585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,8192,0.020683733622233073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,5120,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,3584,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,2560,0.016793600718180337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,1536,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,768,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,128,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,512,32,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,65536,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,5120,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,4096,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,3584,0.01877440015474955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,3072,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,2560,0.017885865767796834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,768,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,512,0.015225600202878317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,128,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,64,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,256,32,0.014402133226394654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,65536,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,12288,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,8192,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,5120,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,6144,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,4096,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,3584,0.016999467213948568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,3072,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,2560,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,1024,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,768,0.014816000064214071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,128,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,256,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,128,32,0.01570026675860087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,65536,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,16384,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,12288,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,10240,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,7168,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,5120,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,3584,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,3072,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,2048,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,1024,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,1536,0.016371200482050575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,512,0.01474666694800059
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,256,0.015222400426864624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,64,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,64,32,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,65536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,16384,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,10240,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,8192,0.018705066045125326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,4096,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,5120,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,3072,0.017066667477289833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,2048,0.016497066617012023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,1024,0.015703466534614564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,512,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,256,0.015224533279736838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,64,0.01495039959748586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,32,32,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,12288,0.14431573549906412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,16384,0.18090559641520182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,10240,0.12458453178405762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,8192,0.09321706295013428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,6144,0.07594666481018067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,7168,0.08394986788431803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,5120,0.06669653256734212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,4096,0.057342934608459475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,3584,0.05123413403828939
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,3072,0.047446401913960774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,2560,0.0428000013033549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,2048,0.03665813207626343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,1536,0.031949865818023684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,1024,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,512,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,256,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,64,0.01938986579577128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,32,0.019318399826685588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,16384,0.06410239934921265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,65536,0.1817962646484375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,12288,0.04614826838175456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,10240,0.04109653234481812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,8192,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,7168,0.03379199902216594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,6144,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,5120,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,4096,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,3584,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,3072,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,1024,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,16384,32,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,16384,0.05331626733144125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,65536,0.14267733891805012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,12288,0.04389546712239583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,10240,0.039185067017873124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,8192,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,7168,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,6144,0.03222506642341614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,5120,0.029422932863235475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,3584,0.023142399390538533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,3072,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,2048,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,1536,0.01713706652323405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,1024,0.016587733229001363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,128,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,64,0.016316800316174825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,12288,32,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,16384,0.04635519981384277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,65536,0.12328960100809734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,12288,0.04082346757253011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,10240,0.036931200822194414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,8192,0.03338239987691243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,7168,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,6144,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,4096,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,3584,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,3072,0.022731733322143555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,2048,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,768,0.016436266899108886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,256,0.01556373337904612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,10240,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,16384,0.03782080014546712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,65536,0.10134293238321941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,12288,0.03290560046831767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,10240,0.03031146725018819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,8192,0.027784534295399982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,7168,0.025124265750249224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,6144,0.024779733022054037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,5120,0.023756800095240276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,3584,0.02130026618639628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,3072,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,2560,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,512,0.016434133052825928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,128,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,8192,32,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,65536,0.09007786909739177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,16384,0.039185067017873124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,12288,0.031061333417892457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,8192,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,7168,0.026074665784835815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,5120,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,6144,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,4096,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,2560,0.017813332875569663
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,2048,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,1536,0.01658986707528432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,256,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,64,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,65536,0.08338773250579834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,16384,0.035499731699625656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,12288,0.032153600454330446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,8192,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,7168,0.024781866868336996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,5120,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,6144,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,4096,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,3072,0.020478934049606323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,2048,0.017339734236399333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,1536,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,1024,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,8,1536,5120,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,512,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,128,0.01597546637058258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,64,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,6144,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,65536,0.07249600092569987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,10240,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,8192,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,6144,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,5120,0.021640533208847047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,3072,0.018633600076039633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,3584,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,1536,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,1024,0.016314666469891867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,128,0.01604373355706533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,32,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,16384,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,65536,0.06434133450190226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,12288,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,10240,0.026897066831588747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,7168,0.024781866868336996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,8192,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,5120,0.02218559980392456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,4096,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,2560,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,1024,0.018227199713389076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,768,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,512,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,128,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,64,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,4096,32,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,65536,0.056251732508341465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,16384,0.029765333731969195
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,7168,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,6144,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,5120,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,2560,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,3072,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,1024,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,64,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3584,32,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,65536,0.050928000609079996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,16384,0.028603732585906982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,12288,0.025942399104436235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,10240,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,8192,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,7168,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,6144,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,5120,0.020683733622233073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,3584,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,3072,0.018703999121983846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,2560,0.01863573392232259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,2048,0.016658133268356322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,1536,0.017748266458511353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,768,0.01693120002746582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,256,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,128,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,32,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,65536,0.04928853511810303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,16384,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,10240,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,6144,0.02075200080871582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,5120,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,3584,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,3072,0.01884053349494934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,2560,0.017885865767796834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,2048,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,128,0.015156267086664834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,64,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2560,32,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,65536,0.04328213135401408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,16384,0.025667200485865276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,12288,0.024439465999603272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,10240,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,8192,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,6144,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,5120,0.01911466717720032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,65536,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,3072,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,2560,0.01740586757659912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,256,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,128,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,2048,32,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,16384,0.027716267108917236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,65536,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,10240,0.0211626668771108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,7168,0.020822399854660036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,6144,0.019798400004704793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,5120,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,4096,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,3072,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,768,0.016437333822250367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,512,0.016437333822250367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,128,0.014677332838376364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1536,32,0.016314666469891867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,65536,0.031267199913660684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,16384,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,8192,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,6144,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,4096,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,3584,0.019387733936309815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,1024,32,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,65536,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,12288,0.021233065923055013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,16384,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,8192,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,2560,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,3072,0.01761386593182882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,1536,0.01720213294029236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,256,0.015359999736150107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,128,0.015837867061297098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,32,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,768,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,65536,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,16384,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,7168,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,6144,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,5120,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,3072,0.017884800831476845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,3584,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,2560,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,1024,0.015565866231918335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,64,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,128,0.014817066987355552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,512,32,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,65536,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,12288,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,10240,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,8192,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,5120,0.01904426614443461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,6144,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,3584,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,3072,0.017475199699401856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,2560,0.016863999764124553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,1024,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,768,0.015631999572118124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,128,0.016382933656374613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,64,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,256,32,0.014732799927393594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,65536,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,16384,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,12288,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,10240,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,8192,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,6144,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,7168,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,5120,0.018567466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,4096,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,5120,12288,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,3584,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,3072,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,1536,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,768,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,256,0.01611199975013733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,128,0.015636266271273295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,65536,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,128,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,10240,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,8192,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,7168,0.019388800859451293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,5120,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,3584,0.01672533353169759
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,3072,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,2048,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,1024,0.01604159971078237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,256,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,128,0.01609386702378591
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,64,32,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,65536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,16384,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,12288,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,10240,0.020071466763814293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,8192,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,6144,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,7168,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,5120,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,3584,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,3072,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,1536,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,1024,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,768,0.015018666783968607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,256,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,128,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,32,32,0.016317866245905557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,12288,0.1411754608154297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,10240,0.12243626912434895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,16384,0.17940479914347332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,6144,0.07536640167236328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,7168,0.08553813298543295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,8192,0.10318293571472167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,5120,0.06570666631062826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,4096,0.0553984006245931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,3584,0.051575465997060144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,3072,0.04642026821772258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,2560,0.0413696010907491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,2048,0.03652373154958089
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,1536,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,1024,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,512,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,256,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,64,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,32,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,65536,128,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,16384,0.06277333498001099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,12288,0.04700160026550293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,65536,0.18063146273295086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,10240,0.04157439867655437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,8192,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,7168,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,6144,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,5120,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,3584,0.024781866868336996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,3072,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,256,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,128,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,4,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,16384,0.051780267556508386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,12288,0.04444160064061482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,65536,0.1406976064046224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,10240,0.039662933349609374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,8192,0.037614933649698895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,7168,0.0347488005956014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,6144,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,5120,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,3584,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,4096,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,2560,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,2048,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,256,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,128,0.015428266922632852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,12288,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,65536,0.12178773085276287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,16384,0.0460810661315918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,12288,0.040139734745025635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,10240,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,8192,0.03386026620864868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,7168,0.03270080089569092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,5120,0.02949013312657674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,6144,0.03126613299051921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,3072,0.02362026572227478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,2560,0.020822399854660036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,2048,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,1024,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,512,0.015634133418401083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,64,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,32,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,65536,0.09956586360931396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,16384,0.037750399112701415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,12288,0.03297386765480041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,10240,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,8192,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,7168,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,6144,0.024714666604995727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,5120,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,4096,0.021912533044815063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,3584,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,3072,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,2560,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,2048,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,1536,0.01679146687189738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,256,0.016317866245905557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,64,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,65536,0.0886783997217814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,16384,0.037750399112701415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,12288,0.03113173246383667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,10240,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,8192,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,7168,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,6144,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,5120,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,4096,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,3072,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,2560,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,128,0.015838932991027833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,64,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,7168,32,0.01611199975013733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,65536,0.08130559921264649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,16384,0.035225598017374675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,12288,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,10240,0.029967999458312987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,7168,0.024372265736262003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,6144,0.023209599653879802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,5120,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,3584,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,3072,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,2560,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,1024,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,256,0.015156267086664834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,64,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,6144,32,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,65536,0.07263466517130533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,16384,0.03317653338114421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,12288,0.03065173427263896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,10240,0.028807467222213744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,8192,0.023347200949986775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,7168,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,3072,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,512,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,128,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,5120,32,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,65536,0.06109866698582968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,16384,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,12288,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,7168,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,6144,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,4096,0.019318399826685588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,2560,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,2048,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,1536,0.01665600041548411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,768,0.015836800138155617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,512,0.016382933656374613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,256,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,64,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,4096,32,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,65536,0.057341865698496496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,16384,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,12288,0.02744320034980774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,10240,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,6144,0.02362026572227478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,5120,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,2048,0.01761386593182882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,1536,0.017476266622543334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,768,0.016382933656374613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,256,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,128,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,16384,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3584,32,0.01576959987481435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,65536,0.050962134202321374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,16384,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,10240,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,8192,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,7168,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,4096,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,2560,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,2048,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,128,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,3072,32,0.015153066317240397
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,65536,0.048128000895182294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,16384,0.026691200335820515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,12288,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,6144,0.021233065923055013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,5120,0.02081813414891561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,4096,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,3072,0.019317332903544107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,1536,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,128,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,3584,0.023550933599472045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2560,32,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,65536,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,16384,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,12288,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,10240,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,7168,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,6144,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,5120,0.01863573392232259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,3584,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,1536,0.01843093236287435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,1024,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,768,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,512,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,2048,32,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,65536,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,16384,0.028331732749938963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,12288,0.02321066657702128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,10240,0.02245866656303406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,5120,0.01880426605542501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,4096,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,3584,0.018569600582122803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,2560,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,1536,0.017407999436060587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,768,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,65536,0.031129600604375203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,16384,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,12288,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,10240,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,7168,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,6144,0.020001065731048585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,4096,0.019798400004704793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,3584,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,3072,0.019293866554896035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,1536,0.01775040030479431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,1024,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,768,0.016658133268356322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,512,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,128,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,65536,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,16384,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,12288,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,6144,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,3072,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,1536,0.01686186591784159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,768,32,0.01651946703592936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,65536,0.03058240016301473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,16384,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,12288,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,10240,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,8192,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,6144,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,4096,0.019523199399312338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,3072,0.017679999272028603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,2560,0.017679999272028603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,1536,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,256,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,65536,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,10240,0.020413867632548013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,8192,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,6144,0.020618667205174766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,4096,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,3584,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,3072,0.01802240014076233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,1536,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,1024,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,128,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,256,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,65536,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,10240,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,8192,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,7168,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,6144,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,3584,0.017268266280492148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,3072,0.017953066031138103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,2048,0.01781760056813558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,1536,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,512,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,128,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,64,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,128,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,65536,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,12288,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,8192,0.018499199549357095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,7168,0.02048106590906779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,6144,0.01986560026804606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,5120,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,3584,0.01843413313229879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,3072,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,2560,0.01692906618118286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,64,0.016437333822250367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,64,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,65536,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,16384,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,12288,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,10240,0.019182932376861573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,7168,0.01918399930000305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,6144,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,4096,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,3584,0.01699519952138265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,3072,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,2048,0.016454399625460307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,1024,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,768,0.01644480029741923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,32,32,0.018228266636530557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,16384,0.17913173039754232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,12288,0.14083093007405598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,10240,0.12120746771494548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,8192,0.1047210693359375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,6144,0.07495786348978678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,5120,0.06666239897410074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,4096,0.05669333140055338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,3584,0.05246293147404989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,3072,0.04727466503779094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,2560,0.04225706656773885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,2048,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,1536,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,1024,0.027373866240183516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,768,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,512,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,256,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,128,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,64,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,32,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,65536,0.18124799728393554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,16384,0.06273706754048666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,12288,0.04724053144454956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,10240,0.04171093304951985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,8192,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,7168,0.03379199902216594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,6144,0.032356266180674234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,5120,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,2560,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,2048,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,1536,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,1024,0.01720213294029236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,768,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,16384,32,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,65536,0.1404256025950114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,16384,0.05147306521733602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,12288,0.043622398376464845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,10240,0.03932160139083862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,8192,0.0357045332590739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,7168,0.03379199902216594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,6144,0.031198932727177935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,5120,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,4096,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,10240,4096,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,3584,0.02430293361345927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,2048,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,1536,0.018363734086354576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,512,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,128,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,64,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,32,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,2,1536,7168,0.02211839954058329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,16384,0.04457813501358032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,65536,0.12100586891174317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,12288,0.03952639897664388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,10240,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,8192,0.03269973397254944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,7168,0.031470932563145954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,6144,0.030718932549158733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,5120,0.02956053415934245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,4096,0.02443839907646179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,3584,0.02437333265940348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,3072,0.022733867168426514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,2048,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,2560,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,1024,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,256,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,64,0.01590506633122762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,10240,32,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,65536,0.09885013103485107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,16384,0.038284798463185624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,10240,0.029626667499542236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,12288,0.03297280073165894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,8192,0.026900267601013182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,7168,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,5120,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,4096,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,3584,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,3072,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,2048,0.018498132626215615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,2560,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,1536,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,128,0.015634133418401083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,64,0.016247466206550598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,8192,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,65536,0.08918186823527018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,16384,0.03761599858601888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,12288,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,8192,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,6144,0.022802132368087768
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,4096,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,3584,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,3072,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,2048,0.017338667313257852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,64,0.01583999991416931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,65536,0.08089599609375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,16384,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,12288,0.03222399950027466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,10240,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,7168,0.022869332631429037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,6144,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,5120,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,3584,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,2560,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,2048,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,1536,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,128,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,64,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,6144,32,0.015838932991027833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,65536,0.07150826454162598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,16384,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,12288,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,10240,0.028467200199762982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,8192,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,6144,0.02204906741778056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,5120,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,4096,0.018773333231608073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,3584,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,2048,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,256,0.015702399611473083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,128,0.01604159971078237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,64,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,5120,32,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,65536,0.062498132387797035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,16384,0.030173865954081218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,10240,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,65536,7168,0.0857098658879598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,7168,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,6144,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,5120,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,3584,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,2560,0.020478934049606323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,3072,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,1536,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,256,0.01604480048020681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,64,0.01590826710065206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,4096,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,65536,0.05638826688130697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,16384,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,12288,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,7168,0.02648853262265523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,3072,0.018908800681432088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,2560,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,1024,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3584,32,0.016110933820406594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,65536,0.05178240140279135
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,16384,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,12288,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,7168,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,2560,0.020071466763814293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,1536,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,1024,0.017682133118311565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,512,0.016454399625460307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,256,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,64,0.015701333681742348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,3072,32,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,65536,0.04788906574249267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,16384,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,8192,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,6144,0.021571199099222817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,4096,0.020413867632548013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,3072,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,2560,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,1536,0.01795413295427958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,768,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,256,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,64,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2560,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,65536,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,16384,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,12288,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,10240,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,6144,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,3584,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,3072,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,12288,2560,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,2560,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,1024,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,32,0.016901334126790367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,2048,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,16384,0.026848000288009644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,65536,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,12288,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,10240,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,5120,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,3584,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,2560,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,2048,0.01816213329633077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,1536,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1536,32,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,65536,0.032358400026957196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,16384,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,12288,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,10240,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,8192,0.021504000822703043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,4096,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,3584,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,3072,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,2048,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,768,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,512,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,128,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,64,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,1024,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,65536,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,16384,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,12288,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,8192,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,10240,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,3584,0.018564265966415406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,2560,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,2048,0.017749333381652833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,1024,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,768,0.016484266519546507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,512,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,128,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,64,0.01576959987481435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,768,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,65536,0.030583467086156207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,12288,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,16384,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,10240,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,7168,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,6144,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,5120,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,3072,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,2560,0.016520532965660095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,2048,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,512,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,256,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,128,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,64,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,32,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,65536,0.02566933234532674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,16384,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,10240,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,12288,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,8192,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,7168,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,6144,0.018634666999181114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,7168,10240,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,3584,0.01713599960009257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,3072,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,768,0.016383999586105348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,512,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,256,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,32,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,65536,0.023509333531061806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,12288,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,16384,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,10240,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,8192,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,7168,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,3584,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,3072,0.0173418660958608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,512,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,256,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,128,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,64,0.016179200013478598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,65536,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,128,32,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,16384,0.01945599913597107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,12288,0.018568533658981323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,10240,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,8192,0.01815999945004781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,7168,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,5120,0.018976000944773357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,6144,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,4096,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,3584,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,3072,0.01693013310432434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,2560,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,1536,0.015631999572118124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,768,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,512,0.015291733543078103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,256,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,64,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,128,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,64,32,0.016453333695729575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,65536,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,16384,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,12288,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,10240,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,7168,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,8192,0.018636800845464072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,5120,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,4096,0.018487467368443807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,3584,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,3072,0.01713493267695109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,2560,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,1536,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,1024,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,768,0.016315733393033348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,256,0.016451199849446617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,512,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,128,0.0159061332543691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,64,0.01562879979610443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,32,32,0.015974400440851848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,512,768,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,fp8,1,256,128,0.015292800466219583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,12288,2.94717534383138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,8192,1.8102954864501952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,10240,2.35393803914388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,16384,4.174441528320313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,6144,1.3762901306152344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,5120,1.1524096171061198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,7168,1.5712938944498698
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,4096,0.9293173472086588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,3584,0.845141347249349
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,2560,0.6306133270263672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,3072,0.7432533264160156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,768,0.2988032023111979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,1024,0.3478528022766113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,2048,0.5460639953613281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,128,0.1853439966837565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,256,0.20824747085571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,512,0.26419199307759605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,65536,1536,0.46148265202840166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,10240,0.7036928176879883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,12288,0.8322399775187174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,16384,1.0464938481648765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,8192,0.555076281229655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,7168,0.4549973487854004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,6144,0.3847509384155273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,4096,0.27265707651774085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,5120,0.3410943984985352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,3584,0.236135466893514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,2560,0.18582186698913575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,3072,0.2135039965311686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,1024,0.10004479885101318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,1536,0.12974080244700115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,2048,0.1523039976755778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,256,0.06372586488723755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,768,0.08625493049621583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,512,0.07615253130594889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,128,0.057479465007781984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,12288,0.6039541244506836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,16384,0.8230218887329102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,10240,0.49885867436726883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,8192,0.40236374537150066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,7168,0.34041172663370767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,6144,0.3089749336242676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,4096,0.21521174112955727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,5120,0.2566165288289388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,3584,0.1926143964131673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,3072,0.16377280553181967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,2048,0.12096853256225586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,2560,0.1472511927286784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,1536,0.10055680274963379
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,1024,0.07871146996816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,512,0.06113280057907104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,768,0.0672426700592041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,256,0.05259946584701538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,128,0.04693333307902019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,16384,0.6410581588745117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,16384,65536,5.571251424153646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,12288,0.48936961491902664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,10240,0.4138997395833333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,12288,65536,3.689302317301432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,8192,0.3203743934631348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,7168,0.2894506772359212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,4096,0.17769920031229655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,5120,0.2178058624267578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,6144,0.2564767996470133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,3072,0.1397429307301839
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,3584,0.15974399248758953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,2560,0.1255754629770915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,1024,0.06782293319702148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,1536,0.08659839630126953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,2048,0.1033567984898885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,768,0.058982400099436436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,256,0.045533867677052815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,512,0.05249706506729126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,128,0.04191679954528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,12288,0.4033205350240071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,16384,0.5399893442789714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,10240,0.3397290547688802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,8192,0.27149651845296224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,10240,65536,2.9690218607584637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,7168,0.2447360038757324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,5120,0.18967893918355305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,6144,0.21377813021341957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,4096,0.15209706624348956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,3584,0.13786452611287434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,3072,0.11980586846669514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,1536,0.07369386355082194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,2048,0.08956586519877116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,2560,0.10659840106964111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,1024,0.057207465171813965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,768,0.04966613451639811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,512,0.045261867841084796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,128,0.037205334504445395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,256,0.040482131640116374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,12288,0.350378672281901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,16384,0.47974294026692704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,10240,0.29593601226806643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,8192,0.24145919481913247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,7168,0.21411733627319335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,6144,0.1917952060699463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,4096,0.13509972890218097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,5120,0.16582080523173015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,3072,0.10673493544260662
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,3584,0.12178773085276287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,2048,0.07946346600850424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,2560,0.09335467020670572
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,8192,65536,2.2163477579752606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,768,0.04444053173065186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,1024,0.05120000044504801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,1536,0.06649279991785685
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,512,0.04020800193150838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,256,0.036865067481994626
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,128,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,12288,0.3217407862345377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,16384,0.4103850682576497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,10240,0.2756597201029459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,8192,0.21957972844441734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,7168,0.20032854080200196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,6144,0.17448959350585938
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,7168,65536,1.9251562754313152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,5120,0.15619413057963055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,4096,0.12311893304189045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,3584,0.11373120148976643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,2560,0.08659626642862955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,3072,0.09980586369832357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,2048,0.0740010658899943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,1024,0.04751253525416056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,1536,0.06085973183314005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,512,0.03768213192621867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,768,0.04150613149007161
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,256,0.034473601977030435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,128,0.032017066081364946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,12288,0.27395413716634115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,16384,0.3553621292114258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,10240,0.23558826446533204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,8192,0.1885855992635091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,7168,0.17162240346272786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,6144,0.1510741392771403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,5120,0.1346218744913737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,4096,0.10728106498718262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,6144,65536,1.6446805318196613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,3072,0.08523093064626058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,2560,0.07447893619537353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,3584,0.0974506696065267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,1024,0.04130133390426636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,1536,0.05287253459294637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,2048,0.06352106730143228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,512,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,768,0.03590933481852214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,128,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,256,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,12288,0.22326614061991373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,16384,0.2883584022521973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,10240,0.19336533546447754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,8192,0.15482773780822753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,7168,0.14103892644246419
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,6144,0.12564693291982015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,5120,65536,1.383082707722982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,4096,0.08891733487447104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,5120,0.11182080109914143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,3584,0.08243199984232584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,2560,0.06359039942423503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,3072,0.07151786486307779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,1024,0.03467839956283569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,2048,0.05447573264439901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,1536,0.04498773415883382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,768,0.03017279903093974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,256,0.02717120051383972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,512,0.02805759906768799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,128,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,12288,0.1983477274576823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,16384,0.26241706212361654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,10240,0.17175893783569335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,8192,0.14172159830729167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,7168,0.12598613103230794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,6144,0.1162922700246175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,4096,65536,1.118890635172526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,4096,0.08277333577473958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,5120,0.10113706588745117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,3584,0.07423893610636392
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,2560,0.05765120188395182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,3072,0.06686826546986899
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,2048,0.04870826800664266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,1024,0.032153600454330446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,1536,0.04102720022201538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,256,0.025464532772699992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,512,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,768,0.027853866418202717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,128,0.023822933435440063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,12288,0.1950719992319743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,16384,0.25920853614807127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,10240,0.16957227389017743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,8192,0.13981013298034667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3584,65536,0.9713674545288086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,7168,0.12445013523101807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,6144,0.11448319753011067
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,5120,0.10018133322397868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,4096,0.08044906457265219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,3584,0.07430826822916667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,3072,0.06516053279240927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,1536,0.03979839881261189
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,2048,0.04754879872004191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,2560,0.0559445341428121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,512,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,768,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,1024,0.03031040032704671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,256,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,128,0.02369173367818197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,12288,0.1762645403544108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,16384,0.2216277281443278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,10240,0.15305280685424805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,8192,0.12137813568115234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,3072,65536,0.9855658849080404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,7168,0.11284480094909669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,6144,0.1000106652577718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,5120,0.09239892959594727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,3584,0.06577599843343099
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,4096,0.0731818675994873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,3072,0.059699201583862306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,2048,0.043009066581726076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,2560,0.05065493186314901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,1536,0.03577173153559367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,768,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,512,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,1024,0.027854933341344194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,128,0.022392533222834268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,256,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,12288,0.14773227373758951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,16384,0.1958229382832845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,10240,0.1297749360402425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,8192,0.10851199626922607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,7168,0.0964949369430542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2560,65536,0.8310431798299154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,6144,0.09018026987711589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,3584,0.05894720156987508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,4096,0.06461439927419027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,5120,0.07963519891103109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,2048,0.037409067153930664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,3072,0.051950931549072266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,2560,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,1024,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,1536,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,256,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,512,0.020595200856526694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,128,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,16384,0.15974292755126954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,12288,0.12455253601074219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,65536,0.716049067179362
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,8192,0.09062293370564779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,10240,0.11021653016408284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,7168,0.08400320212046306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,6144,0.07635626792907715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,4096,0.05533013343811035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,5120,0.07062293688456217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,3584,0.05109759966532389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,3072,0.04491946697235107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,2560,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,2048,0.03222186764081319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,1024,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,1536,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,512,0.01813760002454122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,768,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,256,0.01950613260269165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,128,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1536,65536,0.5992448170979817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,16384,0.13175466855367024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,12288,0.10489173730214436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,8192,0.07611733277638753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,10240,0.09226240317026774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,7168,0.07086186408996582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,6144,0.06509226560592651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,4096,0.04713813463846843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,5120,0.059903999169667564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,3584,0.04259733359018962
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,3072,0.037273601690928145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,2048,0.027306665976842243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,2560,0.031947733958562215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,1024,0.01767146587371826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,1536,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,512,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,768,0.015620266397794088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,256,0.01807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,128,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,1024,65536,0.4704597473144531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,16384,0.13154880205790204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,10240,0.09188693364461263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,12288,0.10219519933064777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,7168,0.06942613124847412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,8192,0.07512746651967367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,6144,0.06471680005391439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,5120,0.06038293441136679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,2048,768,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,3584,0.0423253337542216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,4096,0.04642026821772258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,3072,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,2048,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,2560,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,1536,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,1024,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,768,0.015209600329399109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,512,0.01565120021502177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,256,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,128,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,768,65536,0.47503360112508136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,12288,0.08007573286692302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,16384,0.09925973415374756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,10240,0.07301119963328043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,8192,0.05928959846496582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,7168,0.05539733171463013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,6144,0.05253013372421265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,5120,0.048742401599884036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,4096,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,3584,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,3072,0.028807467222213744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,2048,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,1024,0.01444906691710154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,1536,0.018078933159510292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,256,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,512,0.013699199755986533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,768,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,128,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,12288,0.07881386280059814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,16384,0.09919040203094483
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,10240,0.07137280305226644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,8192,0.058950400352478026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,512,65536,0.3526986757914225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,6144,0.05164586702982584
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,7168,0.05553493499755859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,5120,0.04756053288777669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,4096,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,3584,0.032085333267847696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,3072,0.02778559923171997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,2048,0.020948266983032225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,768,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,1024,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,1536,0.01767146587371826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,512,0.013597866892814637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,256,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,128,0.015687466661135355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,12288,0.08441173235575358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,16384,0.10199039777119953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,256,65536,0.3421866734822591
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,7168,0.056081068515777585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,10240,0.07625386714935303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,8192,0.059562667210896814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,4096,0.03624746799468994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,5120,0.04949333270390828
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,6144,0.05259946584701538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,2560,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,3584,0.03324586749076843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,3072,0.029214932521184282
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,2048,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,1536,0.018077866236368815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,1024,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,512,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,768,0.012742400169372559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,256,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,128,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8192,128,65536,0.35754667917887367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,8192,0.8793098449707031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,10240,1.1065685272216796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,12288,1.287167994181315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,7168,0.811622428894043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,6144,0.6988458633422852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,16384,1.716497039794922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,5120,0.5949440002441406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,4096,0.4913493474324544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,3584,0.43465280532836914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,3072,0.3764224052429199
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,2560,0.33174187342325845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,768,0.1544874668121338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,1024,0.1792682647705078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,512,0.13714879353841145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,256,0.10820266405741374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,1536,0.2409813404083252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,128,0.09359359741210938
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,65536,2048,0.28624213536580406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,10240,0.31368427276611327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,12288,0.36259838740030925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,16384,0.4904608090718587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,8192,0.25402026176452636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,7168,0.22517654101053872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,6144,0.20066986083984376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,5120,0.17251092592875164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,4096,0.13933226267496746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,2560,0.09693866570790609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,3072,0.11240106423695881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,3584,0.12718186378479004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,1024,0.05458026727040609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,1536,0.07092906634012858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,2048,0.08338773250579834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,512,0.04389760096867879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,768,0.048401065667470294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,256,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,128,0.03317760030428569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,12288,0.29764267603556316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,16384,0.3816789309183756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,10240,0.25367892583211266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,8192,0.20094292958577475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,7168,0.18479785919189454
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,6144,0.158788267771403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,5120,0.1416533311208089
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,4096,0.11229866345723469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,3584,0.1040725310643514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,3072,0.09000960191090902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,2048,0.06778879960378012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,2560,0.08093012968699137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,1024,0.045125333468119304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,1536,0.05710506836573283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,768,0.039867734909057616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,512,0.03604480028152466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,256,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,128,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,16384,0.32180906931559244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,16384,65536,1.9914080301920574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,12288,0.24500907262166344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,10240,0.20770133336385094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,8192,0.17032532691955565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,12288,65536,1.524667739868164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,7168,0.15100587209065755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,5120,0.11946667035420735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,6144,0.13475839296976727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,4096,0.09478826522827148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,3072,0.07703893184661866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,3584,0.08768853346506754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,2560,0.06710506280263265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,1536,0.04904959996541341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,2048,0.05799253384272257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,768,0.03522666692733765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,1024,0.03822933435440064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,512,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,128,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,256,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,12288,0.20968213081359863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,16384,0.2705418586730957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,10240,0.17571840286254883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,10240,65536,1.2305408477783204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,8192,0.13786452611287434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,6144,0.1119605302810669
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,7168,0.12670400142669677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,5120,0.09625600179036459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,3072,0.0636245330174764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,3584,0.07212373415629068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,4096,0.08065706888834635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,1536,0.04089173475901286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,2048,0.04829866488774617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,2560,0.05584213336308798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,512,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,768,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,1024,0.032631466786066696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,256,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,128,0.021912533044815063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,12288,0.18240853945414226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,16384,0.23620373407999673
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,10240,0.15387306213378907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,8192,0.12148053646087646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,7168,0.11154666741689045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,6144,0.09748373031616211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,5120,0.08789333502451578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,4096,0.07045119603474935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,3072,0.05744533141454061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,3584,0.06461439927419027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,2048,0.042803200085957845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,2560,0.04980053504308064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,1024,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,1536,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,768,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,512,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,256,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,128,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,8192,65536,1.0420565287272134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,12288,0.17462612787882487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,16384,0.23531519571940102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,10240,0.14970773061116535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,8192,0.12369919617970784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,7168,0.10909012953440349
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,6144,0.09878186384836832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,7168,65536,0.9126239776611328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,4096,0.07110079924265543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,5120,0.0850933313369751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,3584,0.06509013175964355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,2560,0.04829866488774617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,3072,0.056900266806284586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,2048,0.0423253337542216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,1024,0.027988266944885255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,1536,0.03461120128631592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,512,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,768,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,256,0.02067413330078125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,128,0.019308799505233766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,12288,0.1521663983662923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,16384,0.1964373270670573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,10240,0.13172053496042888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,8192,0.10478933652242024
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,7168,0.09721173445383707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,6144,0.08499200344085693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,5120,0.07635626792907715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,4096,0.06106559832890829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,3584,0.056081068515777585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,6144,65536,0.8437088012695313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,3072,0.049459199110666915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,2048,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,1536,0.031196800867716472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,2560,0.04307839870452881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,1024,0.025051732858022053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,512,0.021502933899561563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,768,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,128,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,256,0.018888533115386963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,12288,0.1241429328918457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,16384,0.1658880074818929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,10240,0.10752000013987224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,8192,0.0897706667582194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,7168,0.0799402634302775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,6144,0.07403626441955566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,5120,0.06379520098368327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,4096,0.0525984009106954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,5120,65536,0.7600469589233398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,2560,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,3072,0.042122666041056314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,3584,0.046830932299296066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,1024,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,2048,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,1536,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,256,0.017258665959040322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,768,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,512,0.019368533293406168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,128,0.01644159952799479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,12288,0.1048906644185384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,16384,0.13663466771443683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,10240,0.09178240299224853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,8192,0.075708802541097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,6144,0.062395731608072914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,7168,0.06857386430104574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,4096,65536,0.6187338511149089
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,4096,0.04382719993591309
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,5120,0.055124266942342126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,3584,0.03973120053609212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,3072,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,2560,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,2048,0.026898133754730224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,1024,0.01930026610692342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,1536,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,768,0.018489599227905273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,512,0.017318399747212727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,256,0.016847999890645345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,128,0.01609813372294108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,12288,0.10199146270751953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,16384,0.13271040121714275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,10240,0.089629864692688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,8192,0.07389866511027018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3584,65536,0.4930570602416992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,5120,0.05259946584701538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,6144,0.06113280057907104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,7168,0.06823146343231201
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,4096,0.04348586797714234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,3584,0.03952639897664388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,3072,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,1536,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,2048,0.026761599381764728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,2560,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,512,0.01684266726175944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,768,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,1024,0.01882879932721456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,256,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,128,0.01548479994138082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,12288,0.10390186309814453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,16384,0.13038933277130127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,10240,0.09076053301493327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,8192,0.07226026852925618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,3072,65536,0.4948309262593587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,7168,0.06850666999816894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,6144,0.059562667210896814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,5120,0.053623465696970615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,4096,0.043484799067179364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,3584,0.03829760154088338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,3072,0.03543039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,2560,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,1536,0.023345067103703817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,2048,0.026146133740743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,512,0.016569599509239197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,768,0.017866667111714682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,128,0.014517333110173544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,256,0.014883200327555338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,16384,0.09983999729156494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,12288,0.07874560356140137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,65536,0.4845909436543782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,10240,0.06980266571044921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,8192,0.05833386580149332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,6144,0.047172268231709794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,7168,0.05287466843922933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,4096,0.03420159816741943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,5120,0.04232639869054158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,3584,0.031128533681233722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,3072,0.028126933177312213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,2560,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,2048,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,1536,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,1024,0.015205333630243937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,768,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,512,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,256,0.013562666376431784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,128,0.013196800152460733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2048,65536,0.36915305455525715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,16384,0.09980586369832357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,12288,0.08164693514506022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,8192,0.05802666743596395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,10240,0.0694602648417155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,6144,0.0474453330039978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,5120,0.04246079921722412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,4096,0.0341322660446167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,3584,0.03160533308982849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,3072,0.027922133604685467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,2560,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,2048,0.021766400337219237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,1536,0.018487467368443807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,1024,0.015075199802716575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,65536,0.35822931925455725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,768,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,512,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,256,0.013366400202115377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,128,0.012937600413958231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,16384,0.06990506649017333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,12288,0.05601386626561483
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,10240,0.0518175999323527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,8192,0.041300264994303386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,2560,1024,0.018487467368443807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,7168,0.03795520067214966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,6144,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,4096,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,5120,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,65536,0.24350825945536295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,3072,0.020594133933385213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,3584,0.02300693392753601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,2560,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,1536,0.014389333128929139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,2048,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,1024,0.012366933623949687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,512,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,768,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,256,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1024,128,0.011615999539693196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,12288,0.05502293507258097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,16384,0.06901760101318359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,10240,0.050279466311136875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,8192,0.040209066867828366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,7168,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,6144,0.03351893424987793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,5120,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,4096,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,3584,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,3072,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,2560,0.01813760002454122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,2048,0.01602773368358612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,1536,0.014007467031478881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,1024,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,768,0.012198399504025776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,512,0.012014933427174886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,256,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,128,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,768,65536,0.236680539449056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,12288,0.055606400966644286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,16384,0.06857279936472574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,10240,0.0504149317741394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,8192,0.03972906668980916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,6144,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,7168,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,4096,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,5120,0.02969493269920349
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,3584,0.022256000836690267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,3072,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,2560,0.018077866236368815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,2048,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,1536,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,1024,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,768,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,512,0.012288000186284382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,256,0.011516799529393513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,65536,0.23340373039245604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,512,128,0.011468799908955891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,12288,0.05509119828542074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,16384,0.0680298646291097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,8192,0.03850239912668864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,10240,0.05007359981536865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,6144,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,5120,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,4096,0.023824000358581544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,1536,7168,0.05348693529764811
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,3584,0.021826134125391642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,3072,0.019784533977508546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,2560,0.0181386669476827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,2048,0.01601920028527578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,1024,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,1536,0.013858133554458618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,768,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,512,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,256,0.011523200074831645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,128,0.011310933033625285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,256,65536,0.23490559260050453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,12288,0.054306133588155114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,10240,0.048844798405965166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,16384,0.06816426912943521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,7168,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,8192,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,6144,0.032017066081364946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,4096,0.023826134204864503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,5120,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,3584,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,3072,0.019798400004704793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,2560,0.01773866613705953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,2048,0.01592639982700348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,1536,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,1024,0.01162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,768,0.011935999989509583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,512,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,256,0.011555199821790058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,128,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4096,128,65536,0.23606613477071128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,8192,0.44830719629923504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,10240,0.5518346786499023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,12288,0.6768639882405598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,7168,0.39976959228515624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,6144,0.35590826670328773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,16384,0.8445962905883789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,5120,0.30535573959350587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,4096,0.2544981320699056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,3584,0.22470080057779945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,3072,0.1965727965037028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,2560,0.17312426567077638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,768,0.08215893109639485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,1024,0.09403626918792725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,1536,0.12417706648508708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,128,0.05048319896062216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,2048,0.14820586840311686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,256,0.057241598765055336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,65536,512,0.0723626693089803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,10240,0.15994879404703777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,12288,0.18356906572977702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,16384,0.24466880162556967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,8192,0.1301514705022176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,7168,0.11427840391794841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,6144,0.10318613052368164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,4096,0.07294507026672363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,5120,0.0897706667582194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,3584,0.06754986445109049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,2560,0.05290666818618774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,3072,0.05908480087916056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,1024,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,1536,0.03857066631317139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,2048,0.046353065967559816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,256,0.021076265970865884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,768,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,512,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,128,0.01950506567955017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,12288,0.1643178621927897
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,16384,0.21439146995544434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,10240,0.1404586633046468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,8192,0.11441493034362793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,7168,0.10267199675242107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,6144,0.09018026987711589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,5120,0.07970133622487387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,4096,0.064955735206604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,3072,0.052121599515279136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,3584,0.0590826670328776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,2048,0.03993599812189738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,2560,0.046011734008789065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,1024,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,1536,0.034134399890899655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,768,0.02430400053660075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,512,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,128,0.017246933778127034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,256,0.01843199928601583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,16384,0.18165760040283202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,16384,65536,0.9153535842895508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,12288,0.13970774014790852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,10240,0.11694080034891766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,8192,0.0973141352335612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,12288,65536,0.771174430847168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,7168,0.0863925298055013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,6144,0.07813119888305664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,5120,0.066594131787618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,4096,0.05536426703135172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,3072,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,3584,0.0506880005200704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,2560,0.039665067195892335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,1536,0.02969599962234497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,2048,0.034473601977030435
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,1024,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,512,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,256,0.016847999890645345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,768,0.02218559980392456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,128,0.015610667069753012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,12288,0.11182080109914143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,16384,0.14909440676371258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,10240,0.09615466594696045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,8192,0.08099839687347413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,10240,65536,0.6699008305867513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,5120,0.05676159858703613
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,7168,0.07178239822387696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,6144,0.06529706716537476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,3072,0.0385696013768514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,3584,0.042871467272440594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,4096,0.04792319933573405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,2048,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,1536,0.02553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,2560,0.034474666913350424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,512,0.017192532618840538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,768,0.019435733556747437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,1024,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,128,0.014450132846832275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,256,0.01514240006605784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,12288,0.09117013613382975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,16384,0.11803413232167562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,10240,0.07898560365041098
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,8192,0.06591253280639649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,7168,0.059494400024414064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,6144,0.05369173288345337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,4096,0.039867734909057616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,5120,0.04686506589253743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,3072,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,3584,0.03638506730397542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,2048,0.02505279978116353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,2560,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,8192,65536,0.5430613199869792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,1536,0.02204906741778056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,1024,0.018158932526906334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,768,0.01657600005467733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,256,0.014393599828084311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,512,0.014859732985496522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,128,0.014050133029619851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,12288,0.08908800284067789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,16384,0.11700906753540039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,10240,0.07710933685302734
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,8192,0.06553599834442139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,6144,0.05290666818618774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,7168,0.05887893438339233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,5120,0.04734293222427368
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,4096,0.038365864753723146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,7168,65536,0.4339029312133789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,3072,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,3584,0.03583999872207642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,2560,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,1536,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,1024,0.01806933283805847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,2048,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,512,0.014725333452224732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,768,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,256,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,128,0.012813867131868998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,12288,0.08816533088684082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,16384,0.11427840391794841
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,10240,0.07652693589528402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,8192,0.0634549339612325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,7168,0.057240533828735354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,6144,0.052121599515279136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,5120,0.04450986782709758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,4096,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,3072,0.030653866132100423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,3584,0.0341322660446167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,6144,65536,0.43513174057006837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,2048,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,1536,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,2560,0.027512532472610474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,768,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,1024,0.01765973369280497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,512,0.014457600315411887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,128,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,256,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,12288,0.067413330078125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,16384,0.08290987014770508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,10240,0.05894933144251505
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,8192,0.04802560011545817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,7168,0.04450986782709758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,6144,0.039051731427510575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,4096,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,5120,0.03502080043156942
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,5120,65536,0.4302165349324544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,2560,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,1024,0.014392532904942832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,1536,0.01725226640701294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,2048,0.019777067502339683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,256,0.011534933249155681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,768,0.013570132851600646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,512,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,128,0.010797866185506185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,12288,0.06813013553619385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,16384,0.08297812938690186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,10240,0.05925546487172445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,8192,0.047650134563446044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,7168,0.04450986782709758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,6144,0.03884373505910237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,4096,65536,0.3090421358744303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,4096,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,5120,0.034815998872121175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,3584,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,3072,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,2560,0.022281599044799805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,2048,0.01930453379948934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,1024,0.014519466956456503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,1536,0.01684266726175944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,256,0.011242666840553283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,512,0.01236799955368042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,768,0.013230933745702108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,128,0.010831999778747558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,12288,0.066594131787618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,16384,0.08386560281117758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,10240,0.05775359869003296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3584,65536,0.30637973149617515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,8192,0.04761600097020467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,6144,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,7168,0.042733867963155106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,5120,0.034474666913350424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,4096,0.02887679934501648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,3584,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,3072,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,1536,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,2048,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,2560,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,768,0.013187199831008911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,512,0.011932800213495891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,1024,0.014425599575042724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,256,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,128,0.01074026624361674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,12288,0.06720853646596273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,16384,0.0836949348449707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,10240,0.058266667524973545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,8192,0.04700053135553996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,3072,65536,0.3058346748352051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,7168,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,6144,0.03857066631317139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,5120,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,3584,0.025942399104436235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,4096,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,3072,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,2048,0.018897066513697304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,2560,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,1536,0.01684373418490092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,768,0.012845866878827415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,1024,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,512,0.011958400408426922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,256,0.010829866925875346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,128,0.010668800274531046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,12288,0.04355413516362508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,16384,0.053350400924682614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,10240,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,8192,0.03160640001296997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,7168,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2560,65536,0.3030367851257324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,6144,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,3584,0.018549333016077675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,5120,0.02403200070063273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,4096,0.020126932859420778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,3072,0.01766293247540792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,2560,0.015624533096949259
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,2048,0.014050133029619851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,1024,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,1536,0.012780800461769104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,768,0.010806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,256,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,512,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,128,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,12288,0.04280426502227783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,16384,0.054237866401672365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,10240,0.03638720115025838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,8192,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,6144,0.026146133740743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,2048,65536,0.18776747385660808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,7168,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,4096,0.020118399461110433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,3584,0.018351999918619792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,5120,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,2048,0.01357439955075582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,3072,0.01731626590092977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,2560,0.015209600329399109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,1024,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,1536,0.012275200088818867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,768,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,512,0.010289067029953003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,256,0.00950933297475179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,128,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,12288,0.04137066602706909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,16384,0.05307626724243164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,8192,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,10240,0.03549866676330567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1536,65536,0.1773567994435628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,7168,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,4096,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,3584,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,3072,0.016506666938463845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,2560,0.01493119994799296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,2048,0.013573333621025085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,1536,0.012035199999809265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,1024,0.011172266801198323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,768,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,512,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,256,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,128,0.009079466263453167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,12288,0.040277334054311116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,16384,0.05273600021998087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,1024,65536,0.17810773849487305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,10240,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,7168,0.02744320034980774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,8192,0.02956053415934245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,4096,0.019317332903544107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,6144,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,3072,0.01684160033861796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,3584,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,2560,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,1024,0.010807466506958009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,1536,0.012027733524640401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,2048,0.013700266679128012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,512,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,256,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,768,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,128,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,768,65536,0.17585493723551432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,12288,0.03959253231684367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,16384,0.052239998181660974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,8192,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,7168,0.027100799481074016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,10240,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,5120,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,6144,0.024371200799942018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,4096,0.018897066513697304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,3072,0.016427733500798545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,3584,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,2560,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,2048,0.013220266501108805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,1536,0.011932800213495891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,1024,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,768,0.010289067029953003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,512,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,256,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,128,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,512,65536,0.1774250666300456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,12288,0.03932160139083862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,16384,0.051336534818013514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,8192,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,10240,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,7168,0.027033599217732747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,6144,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,4096,0.018966400623321535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,3072,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,3584,0.017933867375055947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,2560,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,1536,0.012061867117881774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,1024,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,768,0.010491733749707539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,65536,0.1773567994435628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,512,0.009885866443316143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,256,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,128,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,12288,0.039389868577321366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,16384,0.051950931549072266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,8192,0.02990079919497172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,10240,0.034474666913350424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,7168,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,6144,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,4096,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,5120,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,3072,0.01684266726175944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,3584,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,65536,0.17605973879496256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,2560,0.014858667055765787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,2048,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,1536,0.011526399850845337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,1024,0.010718933741251628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,768,0.010289067029953003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,512,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,256,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,128,128,0.009011200070381165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2048,256,2048,0.01325759987036387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,10240,0.3065845489501953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,12288,0.3528362592061361
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,8192,0.23981973330179848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,16384,0.46732053756713865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,7168,0.22169493039449056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,5120,0.1596757411956787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,6144,0.19172693888346354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,4096,0.13339306513468424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,3584,0.1217194636662801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,2560,0.09413866996765137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,3072,0.10417493184407552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,768,0.04532800118128459
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,1024,0.05314559936523437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,1536,0.06720960140228271
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,256,0.03317760030428569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,128,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,512,0.040072532494862874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,65536,2048,0.07935893535614014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,10240,0.09226240317026774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,12288,0.10735039710998535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,16384,0.14424746831258137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,7168,0.06813013553619385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,8192,0.07628906567891439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,6144,0.061850666999816895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,4096,0.04505600134531657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,5120,0.05300906499226889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,3584,0.04123200178146362
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,3072,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,2560,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,1024,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,2048,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,1536,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,512,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,256,0.014016000429789224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,768,0.018204800287882485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,128,0.012822399536768595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,12288,0.08584533532460531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,16384,0.10779413382212322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,10240,0.07403519948323568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,8192,0.0594592014948527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,7168,0.05560319821039835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,6144,0.04881173372268677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,5120,0.042940799395243326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,4096,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,3584,0.03331519961357117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,3072,0.030173865954081218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,2048,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,2560,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,1536,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,1024,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,512,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,768,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,256,0.012102400263150532
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,128,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,16384,0.10789546966552735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,16384,65536,0.5268138567606608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,12288,0.0831157366434733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,10240,0.07458133697509765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,8192,0.05905066728591919
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,12288,65536,0.40987199147542314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,6144,0.04782293240229289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,7168,0.05570559899012247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,5120,0.04184746742248535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,3072,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,3584,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,4096,0.03536213239034017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,1536,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,2048,0.023619200785954794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,2560,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,1024,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,768,0.015067733327547708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,256,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,128,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,512,0.01316480040550232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,12288,0.06140693426132202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,16384,0.0801098664601644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,10240,0.053521064917246494
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,10240,65536,0.4136960029602051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,8192,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,6144,0.03652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,7168,0.040209066867828366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,5120,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,3072,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,4096,0.027854933341344194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,3584,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,1536,0.016166399916013083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,2048,0.018567466735839845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,2560,0.02141653299331665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,768,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,1024,0.013229866822560629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,512,0.011547733346621196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,256,0.01039573351542155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,128,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,12288,0.06113280057907104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,16384,0.07789119879404703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,10240,0.0527018666267395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,8192,0.04375893274943034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,7168,0.039662933349609374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,6144,0.035905067125956217
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,4096,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,5120,0.032017066081364946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,3584,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,2048,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,1536,0.016034133235613503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,1024,0.013172266880671182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,768,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,512,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,256,0.009896533687909444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,128,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,8192,65536,0.2808490753173828
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,12288,0.0606549342473348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,16384,0.07700800100962321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,10240,0.05191680192947388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,8192,0.0437610665957133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,7168,0.039459200700124104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,6144,0.035427200794219973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,5120,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,7168,65536,0.28317012786865237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,4096,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,3072,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,3584,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,2560,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,1536,0.01581760048866272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,2048,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,1024,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,768,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,512,0.01071679989496867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,256,0.009987200299898785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,128,0.00960533320903778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,12288,0.0602453351020813
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,16384,0.07744853496551514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,10240,0.05218986670176188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,8192,0.043211734294891356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,7168,0.039255468050638835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,6144,0.03577173153559367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,5120,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,3584,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,3072,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,2560,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,6144,65536,0.28282880783081055
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,2048,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,1536,0.015611732999483744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,1024,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,768,0.01162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,256,0.009884799520174663
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,512,0.010674132903416952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,128,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,12288,0.037342933813730876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,16384,0.04679679870605469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,10240,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,8192,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,7168,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,6144,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,4096,0.018549333016077675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,5120,65536,0.28344319661458334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,5120,0.021230934063593547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,3072,0.016056533654530844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,3584,0.016908800601959227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,2560,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,1536,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,1024,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,2048,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,256,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,768,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,512,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,128,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,12288,0.03768320083618164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,16384,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,10240,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,8192,0.027512532472610474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,7168,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,6144,0.023346134026845298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,4096,65536,0.1617919921875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,5120,0.021347200870513915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,4096,0.018077866236368815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,3584,0.016847999890645345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,3072,0.015612799922625223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,2560,0.014050133029619851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,2048,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,1536,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,1024,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,768,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,512,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,256,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,128,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,12288,0.03672746817270915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,16384,0.045670398076375324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3584,65536,0.15428266525268555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,10240,0.032630399862925215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,8192,0.02744320034980774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,6144,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,7168,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,5120,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,3584,0.016501333316167197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,4096,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,3072,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,2560,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,2048,0.012684800227483115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,1536,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,768,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,1024,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,512,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,128,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,256,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,12288,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,16384,0.044647467136383054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,10240,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,8192,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,3072,65536,0.15482880274454752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,7168,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,6144,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,5120,0.020615466435750327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,4096,0.01767146587371826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,3584,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,3072,0.01530346671740214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,2048,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,2560,0.013585066795349121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,1536,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,768,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,512,0.009057066837946574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,256,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,128,0.008273066580295562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,16384,0.045398398240407305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,65536,0.15086933771769206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,12288,0.03577173153559367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,8192,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,10240,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,7168,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,6144,0.021912533044815063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,5120,0.020205867290496827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,4096,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,3584,0.016189866264661155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,3072,0.014869333306948344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,2560,0.013665067156155905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,2048,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,1536,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,1024,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,768,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,512,0.00886400043964386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,256,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,128,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2048,65536,0.15107626914978028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,16384,0.043484799067179364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,8192,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,10240,0.030239999294281006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,7168,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,6144,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,4096,0.016951467593510947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,5120,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,3072,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,3584,0.015961600343386333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,2560,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,2048,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,1536,0.010803199807802836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,1024,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,768,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,512,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,256,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,128,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1536,65536,0.15114240646362304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,16384,0.04266666571299235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,10240,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,8192,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,7168,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,6144,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,5120,0.019308799505233766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,4096,0.017249067624409996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,3072,0.014793599645296732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,3584,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,2560,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,2048,0.012033067146937053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,1536,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,1024,0.009543466567993163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,65536,0.15039146741231282
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,768,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,512,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,256,0.008282666901747386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,1024,128,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,12288,0.034542934099833174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,16384,0.04266666571299235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,8192,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,7168,0.023893332481384276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,6144,0.02135466734568278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,5120,0.019706666469573975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,3584,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,3072,0.014792533715566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,2560,0.013250133395195008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,65536,0.1491626739501953
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,2048,0.012060800194740295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,1536,0.010806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,1024,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,768,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,512,0.008714666962623597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,256,0.008317866424719492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,128,0.007965866724650066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,16384,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,12288,0.034474666913350424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,10240,0.03051519989967346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,8192,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,7168,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,65536,0.14909440676371258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,2560,1024,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,6144,0.021824000279108684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,5120,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,4096,0.01684053341547648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,3584,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,3072,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,2048,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,2560,0.013255467017491659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,1536,0.010703999797503154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,768,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,1024,0.00967039962609609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,512,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,256,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,512,128,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,16384,0.04266666571299235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,10240,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,8192,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,6144,0.021432532866795858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,7168,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,4096,0.017248000701268515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,5120,0.019297067324320474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,65536,0.14895787239074706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,3072,0.014450132846832275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,3584,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,2560,0.013264000415802002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,2048,0.012026666601498922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,1536,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,768,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,1024,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,256,0.008343467116355896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,128,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,16384,0.04266666571299235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,12288,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,65536,0.14888960520426434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,10240,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,8192,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,7168,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,6144,0.021346133947372437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,5120,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,4096,0.01684053341547648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,3584,0.015620266397794088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,3072,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,2560,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,2048,0.01202880044778188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,1536,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,1024,0.00960106650988261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,512,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,768,0.009052800138791402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,256,0.008260266482830047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,128,128,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,768,4096,0.01691626707712809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1024,256,512,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,12288,0.2815317471822103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,8192,0.19657386144002278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,10240,0.24371093114217124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,16384,0.36758292516072594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,5120,0.13042346636454266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,6144,0.15250773429870607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,7168,0.1710762659708659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,4096,0.10431146621704102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,2560,0.07424000104268393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,3584,0.09687039852142335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,3072,0.08666453361511231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,768,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,2048,0.0632149338722229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,1024,0.042734932899475095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,128,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,256,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,1536,0.053350400924682614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,65536,512,0.03324480056762695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,10240,0.0734549363454183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,12288,0.08304639657338461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,16384,0.10625920295715333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,8192,0.06058773199717203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,7168,0.053453866640726724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,6144,0.04741013447443644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,4096,0.03583999872207642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,5120,0.042734932899475095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,3584,0.032767999172210696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,2560,0.027510400613149005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,3072,0.029901866118113202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,1024,0.016851200660069784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,1536,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,2048,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,256,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,768,0.014869333306948344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,512,0.01356160044670105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,128,0.0114464004834493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,12288,0.059495464960734046
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,16384,0.0788149356842041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,10240,0.051780267556508386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,8192,0.045124268531799315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,7168,0.03993493318557739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,6144,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,5120,0.03208426634470622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,4096,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,3072,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,3584,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,2048,0.018412800629933675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,2560,0.021572266022364298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,1024,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,1536,0.01601920028527578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,768,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,512,0.011037866274515789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,256,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,128,0.00947093367576599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,16384,0.07482133706410726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,16384,65536,0.41390078862508134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,12288,0.05850453376770019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,8192,0.04266666571299235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,10240,0.051575465997060144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,12288,65536,0.289518928527832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,7168,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,6144,0.03549866676330567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,5120,0.03126613299051921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,3072,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,4096,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,3584,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,1536,0.01616853376229604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,2048,0.01813973387082418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,2560,0.020808533827463786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,1024,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,768,0.012025599678357441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,512,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,256,0.009920000036557516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,16384,0.07567359606424967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,65536,0.2807807922363281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,12288,0.05911893447240194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,10240,0.05246293147404989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,8192,0.04307626485824585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,7168,0.04007360140482585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,6144,0.03495253324508667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,5120,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,3584,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,3072,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,10240,128,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,2048,0.01835413376490275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,1536,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,1024,0.012778666615486146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,512,0.010718933741251628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,768,0.011591466267903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,256,0.010013866424560546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,128,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,12288,0.0606549342473348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,16384,0.07461333274841309
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,10240,0.0524288018544515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,8192,0.0423253337542216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,8192,65536,0.2758655865987142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,7168,0.04020800193150838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,5120,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,6144,0.034474666913350424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,3584,0.024235733350118003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,3072,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,4096,0.027306665976842243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,1536,0.015714133779207863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,2048,0.01766293247540792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,2560,0.019715199867884316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,1024,0.012813867131868998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,768,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,512,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,256,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,128,0.009498666723569233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,12288,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,16384,0.04642133315404256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,10240,0.032290132840474446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,8192,0.028329600890477497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,7168,0.02539413372675578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,6144,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,5120,0.020936532815297445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,4096,0.0187882661819458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,3584,0.01704746683438619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,3072,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,2048,0.012878933548927307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,2560,0.014383999506632486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,1024,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,1536,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,768,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,512,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,128,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,256,0.008444799979527792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,7168,65536,0.2800640106201172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,12288,0.03638720115025838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,16384,0.04389546712239583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,10240,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,8192,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,7168,0.02491733431816101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,6144,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,4096,0.017796266078948974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,6144,65536,0.15974507331848145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,3584,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,3072,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,1536,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,2048,0.012333866953849793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,2560,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,1024,0.009486933549245197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,768,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,512,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,128,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,256,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,12288,0.03543146848678589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,16384,0.04300800164540609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,10240,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,8192,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,7168,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,6144,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,4096,0.01725013256072998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,5120,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,5120,65536,0.15510080655415853
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,3584,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,2560,0.014005333185195923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,3072,0.014803199966748556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,1024,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,1536,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,2048,0.011994666854540507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,768,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,512,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,256,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,128,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,12288,0.034065067768096924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,16384,0.04266666571299235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,10240,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,8192,0.025805866718292235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,6144,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,7168,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,4096,65536,0.14499732653299968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,4096,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,5120,0.019709867238998414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,3584,0.01569066643714905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,3072,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,2560,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,2048,0.011934933066368104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,1024,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,1536,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,768,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,512,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,256,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,128,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,12288,0.03433813254038493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,16384,0.042940799395243326
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3584,65536,0.14629440307617186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,10240,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,8192,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,5120,0.019317332903544107
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,7168,0.023824000358581544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,6144,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,3072,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,3584,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,4096,0.016847999890645345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,1536,0.010737066467603047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,2048,0.012334932883580525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,2560,0.013196800152460733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,768,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,1024,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,512,0.00865600009759267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,256,0.008236800134181977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,128,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,12288,0.03378986517588298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,16384,0.0423253337542216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,10240,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,8192,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,3072,65536,0.14281387329101564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,7168,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,6144,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,5120,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,4096,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,3584,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,3072,0.014383999506632486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,2048,0.012060800194740295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,2560,0.01316373348236084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,1536,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,1024,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,512,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,768,0.009079466263453167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,128,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,256,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,12288,0.03372373183568318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,16384,0.04184746742248535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,10240,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,8192,0.02471359968185425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,7168,0.02300693392753601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,6144,0.020756266514460244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2560,65536,0.14287999471028645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,4096,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,5120,0.01895893414815267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,3584,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,2560,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,3072,0.01397546629110972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,2048,0.011557333668073018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,1024,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,1536,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,768,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,512,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,256,0.008235733211040496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,128,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,12288,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,16384,0.04171200195948283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,10240,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,8192,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,6144,0.020529067516326903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,7168,0.02218559980392456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,2048,65536,0.14397546450297039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,5120,0.01889066696166992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,4096,0.01609813372294108
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,3584,0.015209600329399109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,3072,0.014416000247001648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,2048,0.011591466267903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,2560,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,1536,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,1024,0.00951039989789327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,768,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,256,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,512,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,128,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,12288,0.03242773413658142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,16384,0.04123306671778361
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1536,65536,0.1422005335489909
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,10240,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,7168,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,6144,0.020595200856526694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,5120,0.01835306684176127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,4096,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,3584,0.015271466970443726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,3072,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,2560,0.012743467092514038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,2048,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,1536,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,1024,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,768,0.009040000041325887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,256,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,512,0.0083146666487058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,128,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,12288,0.03283626635869344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,1024,65536,0.1432917277018229
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,16384,0.04061866601308187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,10240,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,8192,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,7168,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,6144,0.020595200856526694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,5120,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,4096,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,3072,0.013705600301424661
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,3584,0.015202132860819497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,2560,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,1536,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,2048,0.011591466267903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,768,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,512,0.008523733417193095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,256,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,128,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,768,65536,0.1421984036763509
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,12288,0.03290666739145915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,10240,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,16384,0.04061866601308187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,7168,0.02218559980392456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,8192,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,6144,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,4096,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,3584,0.014798933267593383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,2560,0.012743467092514038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,3072,0.01418239971001943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,2048,0.011592533191045125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,1536,0.01042133371035258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,1024,0.009532800316810608
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,768,0.008725333213806152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,512,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,256,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,128,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,512,65536,0.14349652926127116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,16384,0.04143786827723185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,12288,0.032425600290298465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,10240,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,8192,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,6144,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,7168,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,5120,0.018544000387191773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,4096,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,3584,0.014812800288200378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,3072,0.01428053379058838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,65536,0.1423360029856364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,2560,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,2048,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,1536,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,1024,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,256,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,512,0.008282666901747386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,256,128,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,10240,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,16384,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,12288,0.03201919992764791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,8192,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,6144,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,5120,0.018103466431299845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,4096,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,65536,0.14254080454508464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,3584,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,3072,0.013994666934013366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,2560,0.01283093293507894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,2048,0.011333333452542622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,1536,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,1024,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,768,0.008785067001978557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,512,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,128,0.007696000238259633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,768,128,256,0.007833600044250488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,8192,0.12929706573486327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,10240,0.15571519533793132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,12288,0.19172693888346354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,7168,0.11489280064900716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,6144,0.09878186384836832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,16384,0.24760212898254394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,5120,0.08751786549886068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,4096,0.07137386798858643
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,3584,0.06413653294245401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,2560,0.051370668411254886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,3072,0.0589141329129537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,1024,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,768,0.02717120051383972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,1536,0.037614933649698895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,2048,0.04457813501358032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,128,0.018071466684341432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,256,0.02018666664759318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,65536,512,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,10240,0.05116586685180664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,12288,0.059903999169667564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,16384,0.07359146277109782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,8192,0.04280426502227783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,7168,0.039933868249257404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,6144,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,4096,0.027215999364852906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,5120,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,3584,0.024577067295710246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,3072,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,2560,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,1024,0.013363200426101684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,1536,0.016090666254361473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,2048,0.018295466899871826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,256,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,768,0.011603200435638427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,512,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,128,0.00949013332525889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,12288,0.057615999380747476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,16384,0.07560640176137289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,10240,0.05017600059509277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,8192,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,7168,0.038091735045115156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,6144,0.03518506685892741
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,5120,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,4096,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,3072,0.02259520093599955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,3584,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,2048,0.017321600516637167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,2560,0.020529067516326903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,1536,0.015204266707102457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,1024,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,512,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,768,0.011617066462834676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,256,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,128,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,16384,0.07331840197245279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,16384,65536,0.27709439595540364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,12288,0.05785706837972006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,10240,0.05058559974034628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,8192,0.04177813529968262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,12288,65536,0.2717013359069824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,7168,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,6144,0.03413333495457967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,5120,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,3072,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,4096,0.02621440092722575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,3584,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,1536,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,2048,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,2560,0.019718400637308755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,1024,0.012266666690508524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,768,0.011142399907112122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,256,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,512,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,128,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,12288,0.035021865367889406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,16384,0.043144532044728595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,10240,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,8192,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,10240,65536,0.2742272059122721
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,7168,0.024370133876800537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,5120,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,6144,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,3584,0.01690666675567627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,4096,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,3072,0.015213867028554281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,1536,0.010805333654085796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,2048,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,2560,0.014006400108337402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,512,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,1024,0.00950933297475179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,768,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,128,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,256,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,12288,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,16384,0.04225813150405884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,10240,0.03065173427263896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,8192,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,7168,0.024301866690317787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,6144,0.021915733814239502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,5120,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,4096,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,3584,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,3072,0.014593066771825156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,2560,0.013597866892814637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,2048,0.01200213332970937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,1024,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,1536,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,768,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,512,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,128,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,256,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,8192,65536,0.1442464033762614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,12288,0.03345066706339518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,16384,0.042461868127187094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,10240,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,8192,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,6144,0.021571199099222817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,7168,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,7168,65536,0.13963839213053386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,4096,0.01684160033861796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,5120,0.019715199867884316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,2560,0.013160533706347146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,3072,0.014043733477592468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,3584,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,1024,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,1536,0.010388267040252686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,2048,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,512,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,768,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,256,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,128,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,12288,0.03290560046831767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,16384,0.04177813529968262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,10240,0.028946133454640706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,8192,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,7168,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,6144,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,5120,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,4096,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,6144,65536,0.13977173169453938
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,3584,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,3072,0.013979732990264893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,1536,0.010396800438563029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,2560,0.013153066237767538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,2048,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,512,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,768,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,1024,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,256,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,128,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,12288,0.03324586749076843
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,16384,0.040209066867828366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,10240,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,8192,0.02450773318608602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,7168,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,6144,0.020273067553838096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,4096,0.01602453291416168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,5120,65536,0.1344853401184082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,5120,0.01930026610692342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,2560,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,3584,0.014794666568438211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,3072,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,1536,0.010388267040252686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,2048,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,256,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,512,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,128,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,12288,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,16384,0.03979839881261189
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,8192,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,6144,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,4096,65536,0.1346901257832845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,5120,0.018549333016077675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,4096,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,3584,0.014871467153231302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,3072,0.01397119959195455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,2048,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,2560,0.012411733468373615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,1536,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,256,0.008170666793982189
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,512,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,128,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,12288,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,16384,0.04020800193150838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3584,65536,0.1335637410481771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,10240,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,8192,0.023824000358581544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,7168,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,6144,0.019992534319559732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,5120,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,4096,0.015682133038838704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,3072,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,3584,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,2048,0.011552000045776367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,2560,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,1536,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,768,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,256,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,12288,0.03208426634470622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,16384,0.03918399810791016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,10240,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,8192,0.023756800095240276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,3072,65536,0.1357141335805257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,7168,0.022120533386866252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,6144,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,5120,0.018071466684341432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,3584,0.014441600441932679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,4096,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,3072,0.013633066415786743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,2048,0.01142080028851827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,2560,0.012401066223780314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,1536,0.010356266299883525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,768,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,512,0.008303999900817871
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,256,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,12288,0.03160853385925293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,16384,0.039389868577321366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,10240,0.027510400613149005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,8192,0.023277866840362548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2560,65536,0.13380160331726074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,6144,0.019592533508936562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,7168,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,3584,0.014389333128929139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,4096,0.015612799922625223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,5120,0.017667200167973837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,2560,0.012401066223780314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,3072,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,1536,0.00997759997844696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,1024,0.009079466263453167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,512,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,128,0.007462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,12288,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,16384,0.039662933349609374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,10240,0.027100799481074016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,6144,0.019715199867884316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,7168,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,2048,65536,0.13489492734273273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,3584,0.014551466703414917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,4096,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,5120,0.017667200167973837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,3072,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,1536,0.010286933183670044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,1024,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,768,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,512,0.008280533552169799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,256,0.00806826651096344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,128,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,16384,0.03870933453241984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,65536,0.1329482634862264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,12288,0.030856533845265703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,8192,0.023414399226506552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,7168,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,6144,0.01952426632245382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,5120,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,4096,0.015614933768908181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,3584,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,3072,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,2560,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,65536,0.13469120661417644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,2048,0.01120746632417043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,1024,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,1536,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,512,0.008341333270072937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,128,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1024,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,12288,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,16384,0.03877439896265666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,7168,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,6144,0.019718400637308755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,5120,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,4096,0.015481600165367126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,3584,0.014385066429773965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,3072,0.013193600376447043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,65536,0.13506560325622557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,2560,0.012333866953849793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,1024,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,1536,0.010331733028093974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,512,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,256,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,768,128,0.0074314668774604796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,16384,0.03904853264490764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,10240,0.02757973273595174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,7168,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,6144,0.019718400637308755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,5120,0.01772800087928772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,4096,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,3584,0.014452266693115234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,3072,0.013229866822560629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,65536,0.13325653076171876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,2560,0.012471466263135274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,1536,0.010013866424560546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,2048,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,1024,0.00940053363641103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,512,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,256,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,512,128,0.007484800120194752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,10240,0.027102933327356978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,7168,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,6144,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,4096,0.01567893326282501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,5120,0.017650133371353148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,65536,0.13428053855895997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,3072,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,3584,0.014518400033315023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,2560,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,2048,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,1536,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,1024,0.009032533566157023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,512,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,256,0.007834666470686594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,256,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,16384,0.03857066631317139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,65536,0.13431466420491536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,7168,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,5120,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,6144,0.019308799505233766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,4096,0.015268266201019287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,3584,0.014792533715566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,2560,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,3072,0.01318186620871226
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,2048,0.011237333218256634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,1536,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,1024,0.009065600236256917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,512,0.00823359986146291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,256,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,128,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,512,1536,2560,0.01237546702226003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,10240,0.1362943967183431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,8192,0.1130837361017863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,12288,0.16349867184956868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,6144,0.08826879660288492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,16384,0.21876053810119628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,7168,0.09762240250905355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,5120,0.07495786348978678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,2560,0.04492053190867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,3072,0.050312534968058265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,3584,0.05778773228327433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,4096,0.0630783994992574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,768,0.023825067281723022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,1536,0.03304106593132019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,1024,0.026829866568247478
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,128,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,2048,0.03925333420435588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,256,0.01684266726175944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,65536,512,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,10240,0.05061866839726766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,12288,0.05792426665623983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,16384,0.07417173385620117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,8192,0.042393600940704344
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,7168,0.037887998421986896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,6144,0.03413333495457967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,4096,0.02600746750831604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,5120,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,3072,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,3584,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,2560,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,1024,0.012411733468373615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,1536,0.015824000040690102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,2048,0.017730132738749186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,768,0.011524266997973124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,256,0.009539199868837993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,512,0.010307199756304423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,128,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,12288,0.03583999872207642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,16384,0.04450986782709758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,10240,0.031948800881703696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,8192,0.026898133754730224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,7168,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,6144,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,4096,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,5120,0.020617600282033285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,3072,0.015549866358439126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,3584,0.016588800152142844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,2048,0.012444800138473511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,2560,0.01411733329296112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,1024,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,1536,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,768,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,512,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,256,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,128,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,16384,0.042531200249989826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,16384,65536,0.27197440465291345
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,12288,0.0339957316716512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,8192,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,10240,0.03092479904492696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,12288,65536,0.15162132581075033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,5120,0.019730132818222047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,7168,0.023962666591008507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,6144,0.02218773365020752
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,3072,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,3584,0.01616853376229604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,4096,0.01731946667035421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,1536,0.010795733332633973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,2048,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,2560,0.013612799843152366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,1024,0.00951039989789327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,512,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,768,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,256,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,128,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,12288,0.03365439971288045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,16384,0.040755200386047366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,10240,65536,0.14424853324890136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,10240,0.02990079919497172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,8192,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,6144,0.021756800015767415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,7168,0.023414399226506552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,5120,0.018978132804234823
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,3072,0.014043733477592468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,3584,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,4096,0.017249067624409996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,1536,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,2048,0.011929600437482198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,2560,0.013156267007191977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,512,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,768,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,1024,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,256,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,128,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,12288,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,16384,0.040482131640116374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,10240,0.029423999786376952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,8192,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,7168,0.022936532894770302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,6144,0.020888533194859824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,4096,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,5120,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,3584,0.015268266201019287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,3072,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,2560,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,2048,0.011523200074831645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,1024,0.009352533022562663
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,1536,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,768,0.008725333213806152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,512,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,128,0.007694933315118153
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,8192,65536,0.133188263575236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,16384,0.040139734745025635
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,12288,0.03222613334655762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,8192,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,10240,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,7168,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,6144,0.02066346605618795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,7168,65536,0.13380160331726074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,4096,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,5120,0.018897066513697304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,3584,0.015267200271288552
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,3072,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,2560,0.012788266936937968
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,2048,0.011586133639017742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,1024,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,1536,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,768,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,256,0.007997866471608479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,128,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,12288,0.032290132840474446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,16384,0.03979946772257487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,10240,0.028398933013280232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,8192,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,7168,0.022574933369954427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,6144,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,5120,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,4096,0.015958399573961893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,3072,0.013668266932169595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,3584,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,6144,65536,0.13202773729960124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,2048,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,2560,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,1536,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,1024,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,768,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,256,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,128,0.007495466868082683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,12288,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,16384,0.039389868577321366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,10240,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,8192,0.023961599667867026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,7168,0.02157333294550578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,6144,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,5120,65536,0.12984320322672527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,4096,0.01567893326282501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,5120,0.01775146722793579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,3584,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,3072,0.013562666376431784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,2560,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,2048,0.01120853324731191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,1536,0.010307199756304423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,512,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,256,0.00787199983994166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,128,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,12288,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,10240,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,8192,0.023539199431737264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,7168,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,6144,0.019377066691716512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,4096,65536,0.13165226777394612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,5120,0.017798399925231932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,4096,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,3584,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,3072,0.013289599617322286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,2560,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,2048,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,1536,0.010290132959683736
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,1024,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,512,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,128,0.007463466624418895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,256,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,16384,0.03884479999542236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3584,65536,0.12980906963348388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,10240,0.027100799481074016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,8192,0.023552000522613525
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,7168,0.020958934227625528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,5120,0.017544533809026083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,6144,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,4096,0.015204266707102457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,3072,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,3584,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,1536,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,2560,0.012370133399963379
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,1024,0.009079466263453167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,256,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,16384,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,10240,0.027104000250498455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,3072,65536,0.1318943977355957
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,7168,0.021093332767486574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,6144,0.018959999084472656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,5120,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,4096,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,3584,0.014042666554450989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,3072,0.013289599617322286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,2048,0.011108266313870747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,2560,0.012288000186284382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,1536,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,512,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,256,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,16384,0.03822933435440064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,10240,0.02744426727294922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,6144,0.01889066696166992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,7168,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2560,65536,0.12997972965240479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,4096,0.01520746648311615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,3584,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,5120,0.01725119948387146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,2048,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,3072,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,2560,0.012036266922950744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,1536,0.009897599617640179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,1024,0.009065600236256917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,768,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,512,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,256,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,128,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,12288,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,16384,0.03843413194020589
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,6144,0.018897066513697304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,7168,0.02060479919115702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,2048,65536,0.131549866994222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,3584,0.014108799894650779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,5120,0.017203199863433837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,4096,0.015233066678047181
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,3072,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,2560,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,2048,0.011059199770291645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,1536,0.010286933183670044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,1024,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,512,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,128,0.007460266848405202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,16384,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1536,65536,0.1295360008875529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,10240,0.026557866732279462
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,7168,0.020936532815297445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,6144,0.019160532951354982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,5120,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,4096,0.015200000007947287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,3584,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,3072,0.012922666470209756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,2560,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,768,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,256,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,512,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,128,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,1024,65536,0.1305941343307495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,12288,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,16384,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,8192,0.02300693392753601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,6144,0.01895786722501119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,5120,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,4096,0.015212800105412802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,3584,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,3072,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,2560,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,2048,0.011206400394439698
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,1024,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,512,0.008342400193214417
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,65536,0.12963840166727703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,128,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,768,256,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,10240,0.026281599203745527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,16384,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,6144,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,4096,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,5120,0.01725013256072998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,3584,0.013994666934013366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,3072,0.013187199831008911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,2560,0.012014933427174886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,2048,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,1536,0.009897599617640179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,1024,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,512,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,256,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,65536,0.12943360010782878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,512,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,16384,0.03781973520914714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,10240,0.026283733050028485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,8192,0.022732800245285033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,6144,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,5120,0.01725119948387146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,4096,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,3584,0.014014933506647745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,65536,0.12827306588490803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,3072,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,2560,0.011964799960454305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,1536,0.009967999656995137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,2048,0.010705066720644633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,1024,0.009125333031018574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,128,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,256,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,16384,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,12288,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,10240,0.026146133740743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,7168,0.020734934012095134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,6144,0.01848640044530233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,65536,0.12718079884847006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,5120,0.016909867525100708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,4096,0.015223466356595359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,3584,0.013994666934013366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,3072,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,2560,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,1024,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,512,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,128,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,384,128,256,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,8192,0.08157866795857747
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,10240,0.09792959690093994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,12288,0.11543893019358317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,7168,0.07215786774953206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,6144,0.062157865365346274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,16384,0.1521663983662923
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,5120,0.05485333204269409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,4096,0.04669440189997355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,3584,0.04191466569900513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,2560,0.033861335118611655
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,3072,0.03843520085016887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,1536,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,768,0.018820265928904213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,1024,0.02033066749572754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,2048,0.029901866118113202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,128,0.012648533781369528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,256,0.013665067156155905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,65536,512,0.016125866770744325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,10240,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,12288,0.03638613224029541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,16384,0.04457813501358032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,8192,0.026694399118423463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,7168,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,6144,0.02217493255933126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,5120,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,4096,0.01752426624298096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,2560,0.014039466778437296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,3072,0.014862933754920959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,3584,0.01602773368358612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,1536,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,1024,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,2048,0.012777599692344665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,512,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,768,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,256,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,128,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,12288,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,16384,0.042461868127187094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,10240,0.02956053415934245
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,8192,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,7168,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,6144,0.021502933899561563
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,4096,0.01694186727205912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,5120,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,3072,0.013983999689420065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,3584,0.01574720044930776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,2048,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,2560,0.012821333607037863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,1024,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,1536,0.01065066655476888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,512,0.008340266346931458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,128,0.007796266674995422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,16384,0.040482131640116374
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,16384,65536,0.1544874668121338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,12288,0.032358400026957196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,10240,0.028331732749938963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,8192,0.024166399240493776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,12288,65536,0.13571732838948566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,6144,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,5120,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,4096,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,3584,0.01520853340625763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,3072,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,2048,0.011218133568763732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,1536,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,2560,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,1024,0.009205333391825358
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,768,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,128,0.007495466868082683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,12288,0.03160746693611145
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,16384,0.039389868577321366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,10240,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,10240,65536,0.1334272066752116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,8192,0.023894399404525757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,7168,0.021913599967956544
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,6144,0.020530132452646892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,5120,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,3584,0.015266133348147073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,4096,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,3072,0.013365333278973898
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,1536,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,2048,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,2560,0.012435199817021687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,512,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,256,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,128,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,12288,0.03099306623140971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,16384,0.03911786476771037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,10240,0.027510400613149005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,8192,0.023481599489847817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,7168,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,6144,0.020125865936279297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,5120,0.018077866236368815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,4096,0.015564800302187601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,3072,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,3584,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,2048,0.011128532886505126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,2560,0.011932800213495891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,1024,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,1536,0.009955199559529622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,128,0.007459199925263722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,8192,65536,0.1291594664255778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,16384,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,7168,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,6144,0.019377066691716512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,7168,65536,0.130457599957784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,4096,0.015209600329399109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,5120,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,2560,0.012025599678357441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,3072,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,3584,0.01444906691710154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,1024,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,2048,0.01114026705423991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,512,0.008242133259773254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,128,0.007445333401362102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,12288,0.030511999130249025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,16384,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,7168,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,6144,0.019170133272806804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,4096,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,5120,0.01765973369280497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,3072,0.01318826675415039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,3584,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,6144,65536,0.12888747056325275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,2560,0.012036266922950744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,2048,0.010806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,1536,0.009920000036557516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,1024,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,256,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,128,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,16384,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,10240,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,7168,0.02053440014521281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,6144,0.019307732582092285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,5120,65536,0.12782933712005615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,4096,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,5120,0.016851200660069784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,3584,0.013633066415786743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,3072,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,2560,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,1536,0.009918933113416035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,1024,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,256,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,128,0.007480533421039581
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,16384,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,10240,0.026283733050028485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,7168,0.020529067516326903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,6144,0.018557866414388023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,4096,65536,0.12861440181732178
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,5120,0.01694186727205912
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,3584,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,4096,0.014596266547838846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,3072,0.012845866878827415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,2560,0.011991467078526814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,2048,0.010738133390744527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,1536,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,768,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,16384,0.037818666299184164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3584,65536,0.1288533369700114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,10240,0.026283733050028485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,5120,0.01684160033861796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,6144,0.01848640044530233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,3584,0.013633066415786743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,3072,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,4096,0.014460800091425577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,1536,0.009896533687909444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,2048,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,2560,0.011959466338157653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,256,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,128,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,16384,0.0370688001314799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,10240,0.026349866390228273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,3072,65536,0.12731733322143554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,7168,0.020257065693537392
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,5120,0.01656426688035329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,4096,0.014826666315396628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,3584,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,3072,0.012812800208727517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,2560,0.011972266435623168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,2048,0.010806399583816528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,1536,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,12288,0.02983040014902751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,16384,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,10240,0.02587413390477498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,8192,0.02218559980392456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2560,65536,0.12745386759440105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,6144,0.01854613423347473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,5120,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,4096,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,3584,0.014042666554450989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,2560,0.011591466267903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,3072,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,1024,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,1536,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,768,0.00865600009759267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,16384,0.036659200986226395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,2048,65536,0.1273856004079183
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,6144,0.018282665808995565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,7168,0.020126932859420778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,4096,0.014425599575042724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,5120,0.016501333316167197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,3584,0.013570132851600646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,2560,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,3072,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,2048,0.010708266496658325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,1024,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,1536,0.010013866424560546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,768,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,16384,0.03652373154958089
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1536,65536,0.12823893229166666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,7168,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,5120,0.016835200786590575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,6144,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,3584,0.01383786698182424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,4096,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,3072,0.012750933567682901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,2560,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,2048,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,512,0.008261333405971526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,128,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,1024,65536,0.12650026480356852
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,12288,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,16384,0.03659093379974365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,10240,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,8192,0.021708800395329794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,7168,0.02018773357073466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,6144,0.01813973387082418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,5120,0.01644159952799479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,4096,0.014791466792424521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,3584,0.013563733299573263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,2560,0.011960533261299134
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,3072,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,128,0.00729066679875056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,768,65536,0.1261567989985148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,8192,0.021766400337219237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,7168,0.020525866746902467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,6144,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,4096,0.014792533715566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,5120,0.01644159952799479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,3584,0.01357439955075582
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,3072,0.012846933801968894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,2560,0.01162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,2048,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,1536,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,1024,0.00899839997291565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,768,0.008259200056393941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,65536,0.12489386399586995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,512,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,16384,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,10240,0.025121066967646283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,8192,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,7168,0.020127999782562255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,6144,0.018143999576568603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,5120,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,4096,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,65536,0.1264298677444458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,3584,0.013605333367983499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,3072,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,2048,0.010905599594116211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,512,0.008341333270072937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,256,256,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,16384,0.03658986488978068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,12288,0.02873813311258952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,8192,0.02216426730155945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,65536,0.12246932983398437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,6144,0.018077866236368815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,4096,0.014485333363215128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,5120,0.016635732849438985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,3584,0.013229866822560629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,3072,0.012345600128173827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,2048,0.011103999614715577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,2560,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,1024,0.008692266543706258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,512,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,768,0.008513066172599792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,256,0.007565866907437642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,256,128,128,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,8192,0.08045120239257812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,10240,0.09939520359039307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,12288,0.11765759785970051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,7168,0.07147520383199056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,6144,0.0634549339612325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,16384,0.1495690663655599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,5120,0.05519253412882487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,4096,0.045670398076375324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,3584,0.04130133390426636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,2560,0.03331306576728821
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,3072,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,768,0.018266665935516357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,1024,0.020525866746902467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,2048,0.02908160090446472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,128,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,512,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,256,0.013562666376431784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,65536,1536,0.02444266676902771
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,10240,0.031402667363484696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,12288,0.03590826590855916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,16384,0.04416960080464681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,8192,0.02648640076319377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,7168,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,6144,0.021824000279108684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,4096,0.017318399747212727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,5120,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,3584,0.01602453291416168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,2560,0.013569066921869913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,3072,0.015200000007947287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,1024,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,1536,0.010737066467603047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,2048,0.012165333827336628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,768,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,256,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,512,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,128,0.007793066898981731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,12288,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,16384,0.04150613149007161
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,10240,0.029832533995310467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,7168,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,6144,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,5120,0.01916159987449646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,4096,0.01644159952799479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,3072,0.014389333128929139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,3584,0.015610667069753012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,2048,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,2560,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,1024,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,1536,0.010718933741251628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,512,0.00830506682395935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,256,0.007894399762153625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,16384,0.040140799681345624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,16384,65536,0.15086933771769206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,12288,0.03256319959958394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,10240,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,8192,0.024100265900293984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,12288,65536,0.135643736521403
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,7168,0.02218559980392456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,6144,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,5120,0.018412800629933675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,4096,0.01609599987665812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,3584,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,3072,0.013564800222714743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,2560,0.012378666798273723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,2048,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,1536,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,256,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,768,0.008669867118199667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,512,0.00824533353249232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,128,0.007492266595363617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,12288,0.030789333581924438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,16384,0.03891199827194214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,10240,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,10240,65536,0.13209599653879803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,7168,0.021640533208847047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,5120,0.018550399939219156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,6144,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,4096,0.015682133038838704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,3584,0.015269333124160766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,3072,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,2048,0.011242666840553283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,2560,0.012337066729863485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,512,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,768,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,128,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,256,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,16384,0.0392522652943929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,10240,0.026964267094930012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,8192,0.023756800095240276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,7168,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,6144,0.02018773357073466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,5120,0.018003199497858682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,4096,0.015713066856066386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,3584,0.014039466778437296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,3072,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,2560,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,2048,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,1024,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,1536,0.010011733571688334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,768,0.008749866485595703
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,256,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,8192,65536,0.12957119941711426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,12288,0.030445865790049237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,16384,0.037818666299184164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,7168,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,6144,0.019718400637308755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,7168,65536,0.1278282642364502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,4096,0.014802133043607077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,5120,0.017318399747212727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,2560,0.011958400408426922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,3072,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,3584,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,2048,0.011172266801198323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,512,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,128,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,16384,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,6144,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,5120,0.01684266726175944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,4096,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,6144,65536,0.12875093619028727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,3584,0.013662933309872945
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,3072,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,2048,0.010798933108647664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,2560,0.012025599678357441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,512,0.008235733211040496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,256,0.007795199751853943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,16384,0.037887998421986896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,10240,0.026281599203745527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,6144,0.01930026610692342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,5120,0.01684160033861796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,5120,65536,0.12878399689992268
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,4096,0.014998400211334228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,2560,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,3072,0.012750933567682901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,3584,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,1024,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,1536,0.009918933113416035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,256,0.007795199751853943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,128,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,12288,0.030105600754419964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,16384,0.03768320083618164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,10240,0.026693334182103474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,6144,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,7168,0.02066453297932943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,4096,65536,0.12721493244171142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,4096,0.01492800017197927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,5120,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,3584,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,3072,0.012845866878827415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,2560,0.011557333668073018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,16384,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3584,65536,0.12683946291605633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,8192,0.02239146629969279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,6144,0.018487467368443807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,5120,0.016851200660069784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,3072,0.012754133343696595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,4096,0.014473600188891092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,3584,0.013573333621025085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,2048,0.01076693336168925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,512,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,768,0.008262399832407634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,256,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,128,0.007426133255163829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,12288,0.029627732435862225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,16384,0.03672639926274617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,3072,65536,0.12875093619028727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,6144,0.01834239959716797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,5120,0.01684373418490092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,3584,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,4096,0.014392532904942832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,3072,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,2560,0.011615999539693196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,1536,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,12288,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,10240,0.025803732872009277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,8192,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2560,65536,0.12690773010253906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,5120,0.01644159952799479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,3584,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,4096,0.014453333616256715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,3072,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,2560,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,1024,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,256,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,128,0.0074325333038965866
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,16384,0.03652160167694092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,6144,0.018081067005793254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,7168,0.020126932859420778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,2048,65536,0.1282058636347453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,5120,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,3584,0.01362986663977305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,4096,0.014393599828084311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,2560,0.012061867117881774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,3072,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,1536,0.009947733084360758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,16384,0.03611413240432739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1536,65536,0.12622506618499757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,8192,0.021639466285705566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,7168,0.02006933291753133
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,6144,0.018078933159510292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,5120,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,4096,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,3584,0.013570132851600646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,2560,0.011654399832089742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,3072,0.012750933567682901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,2048,0.010739200313886007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,1536,0.009943466385205586
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,256,0.007804800073305767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,128,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,1024,65536,0.12707839806874593
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,16384,0.03597546815872192
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,10240,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,7168,0.019715199867884316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,6144,0.018477867046991982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,5120,0.016434133052825928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,4096,0.014425599575042724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,3584,0.01370133360226949
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,3072,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,2560,0.011526399850845337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,1536,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,65536,0.1253376007080078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,256,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,768,128,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,7168,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,6144,0.018077866236368815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,4096,0.014793599645296732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,5120,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,3584,0.01323199967543284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,2560,0.011617066462834676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,3072,0.012845866878827415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,1536,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,65536,0.12380159695943196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,512,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,6144,0.018078933159510292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,4096,0.014813866217931113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,5120,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,3584,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,65536,0.1230847994486491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,3072,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,2560,0.011468799908955891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,1536,0.009897599617640179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,2048,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,768,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,512,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,256,0.007495466868082683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,256,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,7168,0.020118399461110433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,65536,0.12233386834462483
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,6144,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,5120,0.016427733500798545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,4096,0.014826666315396628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,3072,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,2560,0.01149120032787323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,1536,0.00950933297475179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,1024,0.00865600009759267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,256,0.007496533294518788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,192,128,128,0.007048533360163371
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,8192,0.08652799924214681
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,10240,0.10212693214416504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,12288,0.11977386474609375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,7168,0.0769717295964559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,6144,0.06819946765899658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,16384,0.17264639536539714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,5120,0.057652266820271816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,4096,0.04768426815668742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,2560,0.034203732013702394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,3584,0.0425983985265096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,3072,0.038228265444437665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,768,0.018273067474365235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,1024,0.020125865936279297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,2048,0.028807467222213744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,128,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,512,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,256,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,65536,1536,0.024918399254480996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,10240,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,12288,0.037409067153930664
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,16384,0.04727466503779094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,8192,0.026828799645106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,7168,0.02430293361345927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,6144,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,4096,0.01712426741917928
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,5120,0.019913599888483683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,3584,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,2560,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,3072,0.014798933267593383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,1024,0.009830400347709656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,1536,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,2048,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,512,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,768,0.009100799759229023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,256,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,128,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,12288,0.03351893424987793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,16384,0.04102826515833537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,10240,0.029422932863235475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,8192,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,7168,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,6144,0.020618667205174766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,4096,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,5120,0.01909439961115519
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,3072,0.014793599645296732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,3584,0.015203199783960977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,2048,0.011482666929562886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,2560,0.012983466188112894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,1024,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,1536,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,768,0.009079466263453167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,512,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,128,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,256,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,16384,0.040277334054311116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,16384,65536,0.17019200325012207
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,12288,0.032494932413101196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,10240,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,12288,65536,0.13878614107767742
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,6144,0.020528000593185425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,7168,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,5120,0.018501333395640054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,4096,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,3584,0.014525866508483887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,3072,0.013707733154296875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,2048,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,2560,0.012810666362444559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,512,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,256,0.007842133442560833
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,128,0.007492266595363617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,10240,0.02730773289998372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,10240,65536,0.13025279839833576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,8192,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,6144,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,7168,0.02177493373552958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,5120,0.01842026710510254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,3072,0.013160533706347146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,3584,0.014389333128929139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,4096,0.01527253290017446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,1536,0.009979733824729919
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,2048,0.0107722669839859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,2560,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,1024,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,512,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,65536,0.13004906972249347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,16384,0.03925333420435588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,12288,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,65536,0.12851200103759766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,10240,0.02696533401807149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,8192,0.023757867018381753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,6144,0.019363200664520262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,7168,0.021845332781473794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,5120,0.018205867211023966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,4096,0.015202132860819497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,3584,0.01432319978872935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,2560,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,3072,0.013290666540463767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,2048,0.0107722669839859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,1024,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,768,0.0086709330479304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,1536,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,256,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,7168,128,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,12288,0.030037333567937214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,16384,0.03857066631317139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,7168,0.020936532815297445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,6144,0.0197760005791982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,5120,0.017525333166122436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,4096,0.01567893326282501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,3072,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,3584,0.013993600010871887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,2048,0.010761599739392598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,2560,0.012027733524640401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,1024,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,1536,0.010012800494829815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,128,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,8192,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,16384,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,12288,0.029967999458312987
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,6144,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,4096,0.014791466792424521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,5120,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,6144,65536,0.1282047986984253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,3584,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,2560,0.011932800213495891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,3072,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,2048,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,1024,0.008999466896057129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,1536,0.009918933113416035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,512,0.00824533353249232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,16384,0.037275731563568115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,5120,65536,0.12888747056325275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,3584,0.013605333367983499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,4096,0.01486186683177948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,5120,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,2048,0.010739200313886007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,2560,0.011994666854540507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,3072,0.012443733215332032
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,1024,0.009057066837946574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,768,0.008316799998283386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,128,0.007396266857783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,12288,0.029628799359003706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,16384,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,6144,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,7168,0.020127999782562255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,4096,65536,0.12666880289713542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,4096,0.014404267072677612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,3584,0.013563733299573263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,5120,0.01671573321024577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,2048,0.010738133390744527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,2560,0.011617066462834676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,3072,0.012410666545232136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,1024,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,1536,0.009830400347709656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,512,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,256,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,128,0.007396266857783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,12288,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,16384,0.03700266679128011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3584,65536,0.12806826432545979
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,8192,0.022050132354100548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,6144,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,5120,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,4096,0.014851199587186179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,3072,0.012444800138473511
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,3584,0.013605333367983499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,2560,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,256,0.007796266674995422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,12288,0.029219200213750202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,16384,0.037206399440765384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,10240,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,3072,65536,0.12646400133768718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,7168,0.0197269340356191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,6144,0.018549333016077675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,5120,0.016430933276812235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,4096,0.014387200276056925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,3584,0.013737600048383078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,3072,0.012779733538627625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,2048,0.011106133460998535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,2560,0.011557333668073018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,1536,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,1024,0.009050666292508443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,512,0.008242133259773254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,256,0.007826133569081625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,12288,0.029150933027267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,16384,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,10240,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,8192,0.022165334224700926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2560,65536,0.12649599711100262
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,7168,0.020070399840672812
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,6144,0.018481065829594932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,5120,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,4096,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,3584,0.013665067156155905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,3072,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,2560,0.011591466267903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,768,0.008317866424719492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,128,0.007426133255163829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,2048,65536,0.12578240235646565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,6144,0.018078933159510292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,7168,0.019717333714167277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,4096,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,5120,0.016433067123095193
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,3584,0.01323199967543284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,3072,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,2048,0.010707199573516846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,1024,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,512,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,256,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,128,0.007393066585063934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,16384,0.036111998558044436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1536,65536,0.12735146681467693
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,8192,0.021708800395329794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,7168,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,6144,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,5120,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,4096,0.01479039986928304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,2560,0.011958400408426922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,3072,0.012410666545232136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,2048,0.010738133390744527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,256,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,128,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,1024,65536,0.12506453196207684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,12288,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,16384,0.03597653309504191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,7168,0.019715199867884316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,6144,0.01806933283805847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,5120,0.016839466492335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,3584,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,4096,0.014392532904942832
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,3072,0.012846933801968894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,2560,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,1536,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,1024,0.009060266613960265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,768,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,256,0.007558399935563405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,65536,0.1238368034362793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,768,128,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,7168,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,8192,0.02136960029602051
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,6144,0.018040533860524496
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,5120,0.016428800423940022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,3584,0.01322879989941915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,3072,0.012425600488980611
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,2560,0.011557333668073018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,1536,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,1024,0.008690133690834045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,768,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,65536,0.12561066945393878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,512,0.007933866480986278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,512,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,7168,0.01998293399810791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,6144,0.018080000082651773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,5120,0.016428800423940022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,4096,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,65536,0.12390399773915609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,3584,0.01317759950955709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,3072,0.012355200449625651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,2048,0.010851200421651204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,2560,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,1536,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,768,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,128,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,256,256,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,10240,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,65536,0.12281173070271809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,7168,0.019709867238998414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,6144,0.01773653427759806
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,5120,0.016099199652671814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,4096,0.014450132846832275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,2560,0.011102933684984844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,3072,0.011935999989509583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,512,0.007874133189519246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,256,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,128,0.006995200117429097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,160,128,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,10240,0.07376213073730468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,12288,0.08563946882883708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,8192,0.06263466676076254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,16384,0.11270826657613117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,7168,0.05451093514760336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,6144,0.048196268081665036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,5120,0.0421887993812561
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,3584,0.031675734122594196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,4096,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,3072,0.028535467386245728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,2560,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,768,0.013563733299573263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,1024,0.014521599809328715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,256,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,1536,0.01842026710510254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,128,0.009603200356165568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,512,0.011545600493748982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,65536,2048,0.021572266022364298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,10240,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,12288,0.03399680058161418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,16384,0.04232639869054158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,8192,0.025326933463414508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,7168,0.023550933599472045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,6144,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,4096,0.016565333803494772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,5120,0.01884160041809082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,3584,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,2560,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,3072,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,1024,0.009125333031018574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,1536,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,2048,0.011515733599662781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,128,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,256,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,12288,0.03222186764081319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,16384,0.039868799845377605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,10240,0.028194133440653486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,7168,0.021844265858332317
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,6144,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,4096,0.015677866339683533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,5120,0.01813760002454122
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,3072,0.014007467031478881
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,3584,0.014588800072669984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,2048,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,2560,0.012471466263135274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,1024,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,1536,0.010012800494829815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,768,0.00864746669928233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,128,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,256,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,16384,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,16384,65536,0.14178986549377443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,12288,0.0315391997496287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,12288,65536,0.13189226786295574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,7168,0.02136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,6144,0.019847466548283895
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,5120,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,3584,0.014856533209482829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,4096,0.015348266561826071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,3072,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,2048,0.010805333654085796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,1536,0.009918933113416035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,2560,0.012335999806722005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,512,0.008237866560618083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,1024,0.008727467060089112
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,128,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,12288,0.030719999472300214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,16384,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,10240,0.027101866404215497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,10240,65536,0.12912639776865642
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,7168,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,5120,0.01725013256072998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,6144,0.01930026610692342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,3072,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,3584,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,4096,0.014802133043607077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,2560,0.01165013313293457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,2048,0.011172266801198323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,1536,0.009920000036557516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,768,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,128,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,16384,0.03781973520914714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,7168,0.02120959957440694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,6144,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,5120,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,4096,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,3072,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,3584,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,2048,0.010786133011182149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,2560,0.011932800213495891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,1024,0.008669867118199667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,1536,0.009920000036557516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,768,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,128,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,8192,65536,0.12704426447550457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,16384,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,10240,0.025942399104436235
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,6144,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,7168,0.020753065745035805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,7168,65536,0.12660053571065266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,4096,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,5120,0.016714666287104288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,3584,0.013634133338928222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,3072,0.01234346628189087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,2048,0.010762666662534077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,768,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,12288,0.029627732435862225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,10240,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,8192,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,7168,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,6144,0.018489599227905273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,5120,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,4096,0.014459733168284097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,6144,65536,0.1278282642364502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,3072,0.012785067160924276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,2560,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,2048,0.010807466506958009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,512,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,128,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,256,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,12288,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,10240,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,8192,0.022525866826375328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,7168,0.020206934213638304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,6144,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,5120,65536,0.12608853181203206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,5120,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,4096,0.014451199769973755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,3584,0.01325653294722239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,3072,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,2048,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,1536,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,12288,0.02955840031305949
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,8192,0.02155839999516805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,7168,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,6144,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,4096,65536,0.1260543982187907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,5120,0.016429866353670754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,4096,0.013978667060534158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,3584,0.01322879989941915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,2048,0.010718933741251628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,2560,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,3072,0.012470400333404541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,512,0.008273066580295562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,16384,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3584,65536,0.1261567989985148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,8192,0.021822933355967203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,7168,0.0197269340356191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,5120,0.016463999946912132
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,6144,0.017874133586883546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,3584,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,4096,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,3072,0.01241386632124583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,2560,0.011618133385976155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,512,0.008237866560618083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,1024,0.009033600489298504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,768,0.008316799998283386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,16384,0.03631786505381267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,8192,0.021436800559361778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,3072,65536,0.12683946291605633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,7168,0.020137600104014077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,6144,0.018068265914916993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,5120,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,4096,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,3584,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,3072,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,2560,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,1536,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,1024,0.009057066837946574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,256,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,128,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,10240,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2560,65536,0.12588266531626385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,7168,0.019777067502339683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,6144,0.01802026629447937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,5120,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,3584,0.01325653294722239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,4096,0.014416000247001648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,2048,0.010833066701889039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,3072,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,2560,0.011620266238848369
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,768,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,1024,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,512,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,256,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,16384,0.03631786505381267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,2048,65536,0.12595199743906657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,7168,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,6144,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,4096,0.014381866653760275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,5120,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,3072,0.012401066223780314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,1536,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,512,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,65536,0.12479146321614583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,16384,0.03536213239034017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,8192,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,7168,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,6144,0.017729065815607705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,5120,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,4096,0.014039466778437296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,65536,0.12492907047271729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,2048,0.010390399893124899
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,512,0.008237866560618083
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,256,0.007462400197982788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1024,128,0.0073183998465538025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,10240,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,8192,0.021342933177947998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,5120,0.01602133313814799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,65536,0.12472319602966309
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,3072,0.012034133076667786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,2048,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,1536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,768,0.008644266923268636
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,512,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,768,128,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,16384,0.03529599905014038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,7168,0.019843200842539467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,5120,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,65536,0.12055786450703938
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,3072,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,2048,0.01071679989496867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,1536,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,768,0.00864746669928233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,1024,0.008654933174451191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,512,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,256,0.007795199751853943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,512,128,0.007426133255163829
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,8192,0.02116159995396932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,65536,0.12025173505147298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,7168,0.0197760005791982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,6144,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,5120,0.01601920028527578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,4096,0.014385066429773965
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,3584,0.013107200463612875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,2560,0.011580800016721089
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,2048,0.010293333729108175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,1536,0.009894399841626485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,1024,0.009054932991663616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,512,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,256,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,768,0.00824533353249232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,256,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,16384,0.035225598017374675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,65536,0.1213098684946696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,7168,0.019368533293406168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,6144,0.018071466684341432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,5120,0.015687466661135355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,3584,0.013155200084050498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,4096,0.014006400108337402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,3072,0.012167466680208842
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,2560,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,256,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,128,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,1536,2560,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,128,128,1536,0.009474133451779682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,12288,0.08434240023295084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,10240,0.0738645315170288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,8192,0.0606549342473348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,16384,0.11223039627075196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,5120,0.04157333374023438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,6144,0.04980053504308064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,7168,0.053623465696970615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,4096,0.0362496018409729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,2560,0.02539520064989726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,3072,0.029628799359003706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,3584,0.031879466772079465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,2048,0.02198186715443929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,1024,0.014797866344451904
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,1536,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,768,0.013639466961224875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,128,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,512,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,65536,256,0.009921066959698995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,10240,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,12288,0.03365653355916341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,16384,0.04184639851252238
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,8192,0.02484906713167826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,7168,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,6144,0.020207999149958293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,5120,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,4096,0.01622719963391622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,2560,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,3584,0.014792533715566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,3072,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,1024,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,1536,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,2048,0.01192639966805776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,768,0.008317866424719492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,512,0.007901866734027863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,12288,0.031470932563145954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,16384,0.03993599812189738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,10240,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,8192,0.023550933599472045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,7168,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,6144,0.019843200842539467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,5120,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,4096,0.01574613352616628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,3072,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,3584,0.014596266547838846
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,2048,0.010735999544461567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,2560,0.012061867117881774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,1536,0.009920000036557516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,768,0.008682666222254436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,256,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,16384,65536,0.14479360580444336
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,12288,0.03065173427263896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,10240,0.026284799973169966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,12288,65536,0.1311733325322469
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,6144,0.019639466206232706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,5120,0.017593600352605186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,3072,0.012950399518013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,4096,0.015610667069753012
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,3584,0.014082133769989014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,2048,0.010787199934323628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,2560,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,768,0.008631466825803121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,1024,0.008726400136947633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,256,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,16384,0.03768320083618164
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,10240,0.026555732885996504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,10240,65536,0.12916053136189778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,5120,0.01725226640701294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,7168,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,6144,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,3072,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,3584,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,4096,0.014825600385665893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,1536,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,2048,0.01069546639919281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,2560,0.011592533191045125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,128,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,16384,0.037956265608469646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,10240,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,8192,0.022870399554570518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,6144,0.019708800315856933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,5120,0.01684266726175944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,4096,0.015134933590888976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,3584,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,3072,0.012778666615486146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,2048,0.01074026624361674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,2560,0.011618133385976155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,128,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,256,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,8192,65536,0.1272469361623128
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,12288,0.02949013312657674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,8192,0.022252800067265828
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,6144,0.018500266472498576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,7168,0.020533333222071327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,5120,0.016499200463294984
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,4096,0.014186666409174601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,7168,65536,0.12731733322143554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,2560,0.011522133151690166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,3584,0.013326932986577352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,1536,0.009533866246541341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,2048,0.010397866368293762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,256,0.007704533139864604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,65536,0.127729066212972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,8192,0.022529067595799764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,7168,0.020480000972747804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,5120,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,6144,0.018481065829594932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,3584,0.013666133085886637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,4096,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,3072,0.012357333302497863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,2560,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,2048,0.010750933488210043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,256,0.007795199751853943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,128,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,5120,65536,0.1257130702336629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,16384,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,12288,0.029150933027267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,10240,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,6144,3072,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,7168,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,6144,0.018068265914916993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,5120,0.01602773368358612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,4096,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,3072,0.01234346628189087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,2560,0.011617066462834676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,512,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,16384,0.03611413240432739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,10240,0.02532586654027303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,4096,65536,0.12690773010253906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,6144,0.01807253360748291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,7168,0.019716266791025797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,5120,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,3584,0.013229866822560629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,4096,0.01414293348789215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,3072,0.012410666545232136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,2560,0.011538133025169373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,512,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,128,0.0070826664566993715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,10240,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3584,65536,0.12707626819610596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,8192,0.021348265806833903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,6144,0.01806933283805847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,5120,0.01602133313814799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,7168,0.019444266955057778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,3584,0.013157332936922709
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,3072,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,4096,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,2048,0.010601600011189777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,2560,0.011552000045776367
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,1024,0.009079466263453167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,256,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,16384,0.035837864875793456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,8192,0.02136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,3072,65536,0.12561066945393878
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,7168,0.019777067502339683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,6144,0.017730132738749186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,5120,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,4096,0.014109866817792258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,3072,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,768,0.00844586690266927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,1536,0.009673600395520527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,128,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,12288,0.028331732749938963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,16384,0.035947732130686444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2560,65536,0.12608853181203206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,6144,0.01772800087928772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,5120,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,7168,0.019307732582092285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,3584,0.01316373348236084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,4096,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,3072,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,2048,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,2560,0.011217066645622253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,12288,0.028329600890477497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,16384,0.03543039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,8192,0.02116159995396932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,6144,0.017729065815607705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,2048,65536,0.12581546306610109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,3584,0.01325653294722239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,2048,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,2560,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,128,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1536,65536,0.12438186804453533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,8192,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,7168,0.019307732582092285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,5120,0.016123732924461363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,6144,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,3584,0.01325759987036387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,3072,0.01200213332970937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,2560,0.011515733599662781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,1024,0.009048533439636231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,1536,0.00942080020904541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,128,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,65536,0.1241429328918457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,12288,0.027988266944885255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,16384,0.03529493411382039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,8192,0.020959999163945517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,6144,0.01766293247540792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,7168,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,5120,0.01602453291416168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,4096,0.013983999689420065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,3584,0.013220266501108805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,3072,0.01200320025285085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,65536,0.1237674633661906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,2560,0.011548800269762675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,2048,0.010327466328938802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,1024,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,768,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,6144,0.018068265914916993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,5120,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,4096,0.013983999689420065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,3072,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,3584,0.01325440009435018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,65536,0.12014933427174886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,1536,0.009533866246541341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,2560,0.011181867122650147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,256,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,512,128,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,65536,0.12001279989878337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,7168,0.019707733392715455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,6144,0.01807039976119995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,4096,0.014108799894650779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,2560,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,2048,0.010796800255775452
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,1536,0.00942186713218689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,512,0.007833600044250488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,128,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,256,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,10240,0.024642133712768556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,65536,0.11963733037312825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,7168,0.019708800315856933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,6144,0.01753173271814982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,5120,0.01601066688696543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,4096,0.013994666934013366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,3072,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,2048,0.010289067029953003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,2560,0.011517866452534994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,768,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,256,0.007521066566308339
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,128,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,96,1024,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,10240,0.07584319909413656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,8192,0.062156800429026285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,12288,0.08628906408945719
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,5120,0.04396479924519857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,16384,0.11468799908955891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,7168,0.05464853445688883
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,6144,0.048163199424743654
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,3072,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,2560,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,3584,0.03392639954884847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,4096,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,1024,0.015281066298484802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,1536,0.018281600872675576
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,768,0.013219199577967324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,128,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,512,0.01121493379275004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,256,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,65536,2048,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,10240,0.029832533995310467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,12288,0.03331519961357117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,16384,0.04184853235880534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,8192,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,7168,0.022526933749516805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,6144,0.020205867290496827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,4096,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,5120,0.018478933970133463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,2560,0.013220266501108805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,3584,0.014798933267593383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,3072,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,1024,0.008725333213806152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,1536,0.010171733299891154
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,2048,0.01185706655184428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,256,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,768,0.008518399794896443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,12288,0.031335467100143434
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,16384,0.03979733387629191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,10240,0.028125866254170732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,7168,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,6144,0.019715199867884316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,5120,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,4096,0.015348266561826071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,3072,0.013605333367983499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,3584,0.014460800091425577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,2048,0.010737066467603047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,2560,0.012376532951990763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,1536,0.00974826713403066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,512,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,128,0.007086933155854543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,16384,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,16384,65536,0.14138026237487794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,12288,0.030584534009297688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,8192,0.02300693392753601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,12288,65536,0.1305941343307495
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,6144,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,5120,0.01772800087928772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,4096,0.015200000007947287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,3072,0.013223466277122498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,3584,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,1536,0.009508267045021057
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,2560,0.011576533317565918
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,2048,0.010797866185506185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,128,0.007413333157698314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,256,0.007764266431331634
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,16384,0.03822933435440064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,10240,65536,0.12799999713897706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,8192,0.022938666741053264
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,5120,0.017658666769663493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,6144,0.019103999932607016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,4096,0.014793599645296732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,3584,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,3072,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,1536,0.009512533744176228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,2048,0.010698666175206501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,2560,0.011515733599662781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,256,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,8192,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,7168,0.020936532815297445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,6144,0.018820265928904213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,5120,0.01725119948387146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,4096,0.014452266693115234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,3072,0.012404266993204753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,3584,0.013633066415786743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,2560,0.011515733599662781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,512,0.007892266909281413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,128,0.007418666779994964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,8192,65536,0.1272810697555542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,12288,0.029625600576400755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,16384,0.037478399276733396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,10240,0.026284799973169966
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,8192,0.022574933369954427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,6144,0.019157334168752035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,7168,65536,0.1261578639348348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,5120,0.016703999042510985
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,2560,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,3072,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,3584,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,1536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,2048,0.010831999778747558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,512,0.007930666704972585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,256,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,10240,0.02614826758702596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,7168,0.02034453352292379
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,6144,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,4096,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,5120,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,6144,65536,0.12598613103230794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,3072,0.012469333410263062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,2560,0.011548800269762675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,2048,0.010307199756304423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,512,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,256,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,16384,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,6144,0.01806933283805847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,5120,65536,0.1257472038269043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,4096,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,5120,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,2560,0.011661866307258606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,3072,0.012370133399963379
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,1024,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,512,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,12288,0.029287467400232952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,16384,0.03631786505381267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,8192,0.021572266022364298
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,7168,0.020119466384251914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,4096,65536,0.12602026462554933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,6144,0.017667200167973837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,5120,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,2560,0.011139200131098429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,3072,0.01234346628189087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,12288,0.02879573305447896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,16384,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3584,65536,0.1254730701446533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,10240,0.02518933415412903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,5120,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,4096,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,3584,0.013196800152460733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,3072,0.012272000312805176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,2048,0.010398933291435241
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,1024,0.008714666962623597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,768,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,256,0.00749120016892751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,128,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,10240,0.02512213389078776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,8192,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,3072,65536,0.12649813493092854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,6144,0.01807253360748291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,5120,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,3584,0.013153066237767538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,4096,0.013978667060534158
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,3072,0.012355200449625651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,2560,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,1536,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,1024,0.0086709330479304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,16384,0.03618239959081014
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,65536,0.12540586789449054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,12288,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,8192,0.02141653299331665
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,10240,0.024779733022054037
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,7168,0.019386667013168334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,6144,0.01767146587371826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,5120,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,4096,0.014014933506647745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,3584,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,3072,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,2560,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,1536,0.009830400347709656
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,768,0.008378666639328004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,512,0.007869866490364075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,256,0.007863466441631318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,65536,0.1252351999282837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2048,128,0.007394133508205414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,8192,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,6144,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,7168,0.019308799505233766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,4096,0.013673599561055502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,3584,0.013176533579826354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,3072,0.012035199999809265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,2560,0.011512533823649088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,256,0.007416533430417378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,512,0.007874133189519246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,128,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1536,65536,0.1257813294728597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,12288,0.028350933392842607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,8192,0.021436800559361778
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,6144,0.01772800087928772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,4096,0.014039466778437296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,3584,0.013156267007191977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,3072,0.012435199817021687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,2560,0.011585066715876263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,2048,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,1536,0.00947093367576599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,65536,0.12247040271759033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,256,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,512,0.0076341331005096436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,1024,128,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,7168,0.01936533252398173
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,5120,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,3584,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,3072,0.011923199892044068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,65536,0.12151467005411784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,2560,0.01120853324731191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,1536,0.00981119970480601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,2048,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,256,0.0074976002176602675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,768,128,0.007285333176453908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,8192,0.020946133136749267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,7168,0.019320533672968546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,6144,0.017326933145523072
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,5120,0.01567893326282501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,65536,0.12127573490142822
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,3584,0.013224533200263977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,2560,0.011515733599662781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,3072,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,2048,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,1536,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,512,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,128,0.007284266750017802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,512,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,8192,0.02094399929046631
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,65536,0.1213098684946696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,7168,0.019301333030064902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,6144,0.017258665959040322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,5120,0.016123732924461363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,4096,0.01397546629110972
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,3072,0.01276693344116211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,2560,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,3584,0.013196800152460733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,2048,0.010680533448855082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,1024,0.00862506628036499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,256,0.0074986666440963745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,128,0.007441066702206929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,65536,0.11939840316772461
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,8192,0.020946133136749267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,7168,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,6144,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,5120,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,3584,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,4096,0.014013866583506266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,3072,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,2560,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,2048,0.010427733262379963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,1024,0.0086517333984375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,768,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,256,0.007418666779994964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,128,128,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,2560,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,80,256,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,10240,0.07434240182240805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,12288,0.08584533532460531
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,8192,0.062122666835784913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,16384,0.11615573565165202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,7168,0.059699201583862306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,6144,0.050826664765675864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,5120,0.04505493243535359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,3584,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,4096,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,2560,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,3072,0.02997013330459595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,1024,0.014855466286341348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,768,0.013573333621025085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,1536,0.01904746691385905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,512,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,256,0.00950933297475179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,128,0.009128533800443013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,65536,2048,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,10240,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,12288,0.03310933311780294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,16384,0.04143786827723185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,8192,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,7168,0.022529067595799764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,6144,0.020057600736618043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,4096,0.015889066457748412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,5120,0.018148267269134523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,3584,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,3072,0.013699199755986533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,2560,0.013026133179664612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,1024,0.0086709330479304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,1536,0.009879466891288758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,2048,0.011556266744931539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,768,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,512,0.008270933230717977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,256,0.007492266595363617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,12288,0.03139946659406026
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,16384,0.0395957350730896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,10240,0.0277834673722585
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,7168,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,6144,0.019375999768575035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,5120,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,4096,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,3584,0.014459733168284097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,3072,0.013229866822560629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,2560,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,512,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,128,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,16384,0.03850239912668864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,16384,65536,0.1416543960571289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,12288,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,8192,0.02259733279546102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,12288,65536,0.13315412998199463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,7168,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,5120,0.01731733282407125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,6144,0.019308799505233766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,4096,0.0156768004099528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,3584,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,3072,0.012819199760754903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,1536,0.009544533491134644
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,2048,0.010833066701889039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,2560,0.01202880044778188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,512,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,128,0.007359999914964039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,12288,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,16384,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,10240,65536,0.12834133307139078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,5120,0.017525333166122436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,6144,0.018908800681432088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,3072,0.012410666545232136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,3584,0.013665067156155905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,4096,0.014834133783976236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,2560,0.011525332927703857
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,1536,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,128,0.007189333438873291
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,12288,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,16384,0.037205334504445395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,10240,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,8192,0.022325332959493002
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,7168,0.02053546706835429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,6144,0.018897066513697304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,4096,0.014731733004252115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,5120,0.017052799463272095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,3584,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,3072,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,2560,0.011556266744931539
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,2048,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,8192,65536,0.12639573415120442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,768,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,12288,0.029491200049718218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,16384,0.03734399875005086
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,10240,0.026146133740743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,8192,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,6144,0.018481065829594932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,7168,65536,0.12683946291605633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,5120,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,4096,0.014043733477592468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,2560,0.01158186693986257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,3072,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,3584,0.01339413324991862
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,1536,0.009475200374921163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,2048,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,16384,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,10240,0.026011733214060466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,8192,0.02198186715443929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,7168,0.02018773357073466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,6144,0.018078933159510292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,5120,0.0160863995552063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,3072,0.012436266740163167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,6144,65536,0.12557653586069745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,2048,0.01074026624361674
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,1536,0.009545600414276123
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,2560,0.011523200074831645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,1024,0.008750933408737182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,16384,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,10240,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,8192,0.021961599588394165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,7168,0.020002132654190062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,6144,0.01814080079396566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,5120,65536,0.12547413508097333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,5120,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,3584,0.013153066237767538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,2048,0.010423466563224792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,2560,0.011618133385976155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,3072,0.01234346628189087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,128,0.007293866574764251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,12288,0.029421865940093994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,16384,0.036593067646026614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,4096,65536,0.12540586789449054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,6144,0.018023467063903807
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,5120,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,2560,0.011538133025169373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,3072,0.01234346628189087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,1536,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,256,0.007696000238259633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,128,0.007226666808128357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,16384,0.03645333449045817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3584,65536,0.12547413508097333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,5120,0.015822933117548624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,7168,0.019367466370264687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,6144,0.017667200167973837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,3584,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,3072,0.012168533603350322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,1536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,2560,0.011238400141398113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,2048,0.01032319962978363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,512,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,128,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,12288,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,8192,0.020958934227625528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,3072,65536,0.12683946291605633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,6144,0.01772800087928772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,3584,0.013153066237767538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,3072,0.012354133526484172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,2048,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,2560,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,1536,0.00953493316968282
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,1024,0.008710400263468424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,128,0.00722453345855077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,16384,0.0357045332590739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,10240,0.024851200977961223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2560,65536,0.12527039845784504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,6144,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,5120,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,3584,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,2560,0.01120853324731191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,1536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,12288,0.027922133604685467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,10240,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,2048,65536,0.12588160037994384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,6144,0.01766293247540792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,7168,0.019307732582092285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,4096,0.013993600010871887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,5120,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,2048,0.0105813334385554
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,3072,0.01199893355369568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,768,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,16384,0.035225598017374675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,65536,0.12410879929860433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,12288,0.027922133604685467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,10240,0.02423680027325948
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,8192,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,7168,0.019307732582092285
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,6144,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,4096,0.013845333456993103
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,65536,0.12062719662984211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,3072,0.011934933066368104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,3584,0.012821333607037863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,2560,0.011342933773994446
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,768,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,512,0.007805866499741872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,256,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1024,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,16384,0.03522773186365764
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,6144,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,4096,0.013974400361378989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,5120,0.015827199816703795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,3584,0.013153066237767538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,65536,0.12052480379740398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,2560,0.011412266890207927
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,768,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,512,0.007825066645940144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,768,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,8192,0.020948266983032225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,7168,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,6144,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,5120,0.015825066963831583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,4096,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,65536,0.11991039911905925
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,3584,0.012889599800109864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,3072,0.011934933066368104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,2560,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,768,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,512,0.007829333345095318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,128,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,512,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,8192,0.02094506621360779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,65536,0.11950080394744873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,7168,0.019237333536148073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,6144,0.01726186672846476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,3072,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,3584,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,2560,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,1536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,128,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,256,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,65536,0.11933013598124187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,8192,0.020947200059890748
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,7168,0.01917440096537272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,6144,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,5120,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,3584,0.013187199831008911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,3072,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,2560,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,2048,0.01030613382657369
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,768,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,512,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,256,0.007153066496054332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,128,128,0.007054933408896129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,64,1536,256,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,10240,0.07342080275217691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,8192,0.06205546855926514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,12288,0.08898560206095377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,16384,0.12393813133239746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,6144,0.05331626733144125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,7168,0.05758293469746908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,5120,0.04266560077667236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,2560,0.02553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,3072,0.03010666569073995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,3584,0.03242986599604289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,4096,0.037956265608469646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,1024,0.015203199783960977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,1536,0.018759467204411826
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,2048,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,768,0.01370133360226949
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,256,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,128,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,65536,512,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,10240,0.029286400477091475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,12288,0.03331306576728821
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,16384,0.04184746742248535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,8192,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,7168,0.02225493391354879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,6144,0.020397865772247316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,4096,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,5120,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,2560,0.012809600432713827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,3584,0.015210666259129844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,3072,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,1536,0.0098880002895991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,2048,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,256,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,128,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,12288,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,16384,0.03945813179016113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,10240,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,7168,0.021026132504145305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,6144,0.019578667481740315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,4096,0.015314132968584696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,5120,0.01753173271814982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,3072,0.013470932841300964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,3584,0.014393599828084311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,2048,0.010738133390744527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,2560,0.012344533205032348
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,1536,0.009474133451779682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,512,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,768,0.00824533353249232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,128,0.007054933408896129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,16384,0.03829760154088338
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,16384,65536,0.14185813268025715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,12288,0.030036266644795733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,8192,0.022664533058802287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,12288,65536,0.13073066870371503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,7168,0.02100373307863871
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,5120,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,6144,0.018897066513697304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,4096,0.014999467134475707
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,3072,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,3584,0.014381866653760275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,1536,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,512,0.007899733384450276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,256,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,128,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,12288,0.02969599962234497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,16384,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,10240,65536,0.12789759635925294
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,8192,0.022804266214370726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,6144,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,5120,0.01745599905649821
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,3072,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,3584,0.013563733299573263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,4096,0.014801067113876343
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,2048,0.010391466816266378
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,2560,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,512,0.00793280005455017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,1024,0.008669867118199667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,128,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,7168,0.020937599738438926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,6144,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,5120,0.017352533340454102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,4096,0.014381866653760275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,3072,0.012337066729863485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,3584,0.013665067156155905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,2560,0.011548800269762675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,2048,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,1536,0.00951573352018992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,256,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,128,0.007285333176453908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,8192,65536,0.12615573406219482
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,16384,0.03638720115025838
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,6144,0.018478933970133463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,7168,0.02012373407681783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,7168,65536,0.1261567989985148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,4096,0.014390400052070618
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,5120,0.016432000199953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,3584,0.013160533706347146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,2560,0.011345066626866658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,3072,0.012377599875132244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,2048,0.010326400399208069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,256,0.007493333518505096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,128,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,12288,0.029191466172536214
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,10240,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,7168,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,6144,0.0180896004041036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,5120,0.01602133313814799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,6144,65536,0.12663466930389405
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,3584,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,3072,0.012266666690508524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,1536,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,2560,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,512,0.00782719999551773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,256,0.007593599955240886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,12288,0.02956266601880391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,16384,0.03618026574452718
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,10240,0.02553279995918274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,8192,0.02157333294550578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,7168,0.0201855997244517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,6144,0.0180021325747172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,5120,65536,0.12547413508097333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,4096,0.01397333343823751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,5120,0.016090666254361473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,3584,0.013194666306177775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,3072,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,1536,0.00953493316968282
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,128,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,4096,65536,0.1257472038269043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,6144,0.018071466684341432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,7168,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,4096,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,3584,0.013229866822560629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,5120,0.016042666633923848
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,3072,0.012436266740163167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,2048,0.010327466328938802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,512,0.0075647999842961625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,256,0.007461333274841308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,16384,0.03597653309504191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,65536,0.1253717343012492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,8192,0.02095680038134257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,7168,0.01966080069541931
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,6144,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,3584,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,4096,0.01381119986375173
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,3072,0.01236799955368042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,2048,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,1024,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,768,0.008250666658083598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,256,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,128,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3072,65536,0.12567893664042157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,16384,0.03604480028152466
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,6144,0.01765973369280497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,3584,0.013160533706347146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,3072,0.012401066223780314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,2048,0.010300800204277039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,1536,0.009507200121879578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,1024,0.008669867118199667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,128,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,16384,0.03549866676330567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2560,65536,0.12499626477559407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,10240,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,12288,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,5120,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,3072,0.012171733379364013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,2560,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,768,0.00804373323917389
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,256,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,2048,65536,0.12462080319722493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,12288,0.028262400627136232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,8192,0.020958934227625528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,3584,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,6144,0.01765973369280497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,5120,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,4096,0.01397333343823751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,3072,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,2048,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,2560,0.01120853324731191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,768,0.008180266618728638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,256,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1536,65536,0.12390399773915609
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,8192,0.02100480000178019
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,7168,0.019309866428375243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,5120,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,6144,0.01806933283805847
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,3584,0.013153066237767538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,3072,0.01236799955368042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,2560,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,2048,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,1024,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,128,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,256,0.007050666709740956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,1024,65536,0.12158293724060058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,10240,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,7168,0.019297067324320474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,8192,0.020594133933385213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,6144,0.01732800006866455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,5120,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,3584,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,4096,0.013638400038083396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,3072,0.012026666601498922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,2560,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,65536,0.12247040271759033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,256,0.007425066828727722
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,768,128,0.007053866485754649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,12288,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,16384,0.03543039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,7168,0.019709867238998414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,8192,0.02095680038134257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,4096,0.013570132851600646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,5120,0.016090666254361473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,3584,0.012785067160924276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,2560,0.01165120005607605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,3072,0.01200213332970937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,1536,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,1024,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,65536,0.11967253684997559
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,768,0.008215466638406117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,512,0.00803306649128596
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,512,128,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,16384,0.03543039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,6144,0.017795199155807497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,7168,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,5120,0.015633066495259605
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,4096,0.013994666934013366
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,65536,0.11919360160827637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,3072,0.012371200323104858
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,2048,0.009985066453615824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,1536,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,1024,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,256,0.007054933408896129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,256,128,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,12288,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,65536,0.12117226918538411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,8192,0.020888533194859824
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,7168,0.019299199183781944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,6144,0.01732800006866455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,5120,0.016122666994730632
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,4096,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,3584,0.013190399607022604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,3072,0.011934933066368104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,2048,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,768,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,1024,0.008283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,256,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,128,0.007014399766921997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,48,128,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,10240,0.07717546621958414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,12288,0.08915627002716064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,8192,0.06898346741994223
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,16384,0.1162922700246175
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,7168,0.0612010677655538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,6144,0.053179732958475744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,5120,0.04686506589253743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,3584,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,4096,0.037272532780965165
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,3072,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,2560,0.027102933327356978
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,1024,0.015336533387502035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,768,0.01407360037167867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,1536,0.01903466582298279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,2048,0.023277866840362548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,128,0.00906880001227061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,256,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,65536,512,0.01172160009543101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,10240,0.02908373276392619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,12288,0.03317760030428569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,16384,0.041915734608968094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,8192,0.024693334102630617
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,7168,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,6144,0.02046826680501302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,4096,0.016090666254361473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,5120,0.01808746655782064
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,3584,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,3072,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,2560,0.012883200248082479
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,1536,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,2048,0.01162559986114502
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,512,0.007894399762153625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,128,0.007394133508205414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,12288,0.03078826665878296
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,16384,0.03898026545842488
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,10240,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,7168,0.02135573426882426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,6144,0.01930026610692342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,4096,0.015268266201019287
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,5120,0.017258665959040322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,3072,0.013196800152460733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,3584,0.014383999506632486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,2048,0.010760533809661865
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,2560,0.012035199999809265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,256,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,128,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,16384,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,16384,65536,0.14458880424499512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,12288,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,12288,65536,0.13124266465504963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,7168,0.020946133136749267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,5120,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,6144,0.019102933009465535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,3584,0.014074666301409402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,4096,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,3072,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,1536,0.009613866607348125
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,2048,0.010739200313886007
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,2560,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,256,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,12288,0.029969066381454468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,16384,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,10240,0.02635093331336975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,10240,65536,0.12721493244171142
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,8192,0.022459733486175536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,6144,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,5120,0.017193599541982015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,3584,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,4096,0.014589866995811463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,2560,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,3072,0.01244586706161499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,2048,0.010422399640083313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,1024,0.00865600009759267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,256,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,512,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,128,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,16384,0.03686399857203166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,10240,0.025737599531809492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,65536,0.12622506618499757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,8192,0.022184532880783082
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,5120,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,6144,0.018819200992584228
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,4096,0.014424533645311991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,3584,0.013361066579818726
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,8192,7168,0.021233065923055013
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,2560,0.011450666189193725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,3072,0.012716799974441528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,1536,0.009878399968147277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,768,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,256,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,128,0.007086933155854543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,7168,65536,0.12663573424021404
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,10240,0.025668267409006757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,7168,0.020803199211756388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,4096,0.014519466956456503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,5120,0.016371200482050575
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,6144,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,2560,0.011150933305422465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,3584,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,3072,0.012339199582735699
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,1024,0.008661333719889324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,2048,0.010397866368293762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,512,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,768,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,128,0.00738560010989507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,8192,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,7168,0.02059626579284668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,6144,0.018078933159510292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,5120,0.016500266393025716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,3072,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,2048,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,256,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,6144,65536,0.12547413508097333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,12288,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,10240,0.02519039909044902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,8192,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,5120,65536,0.12540586789449054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,7168,0.019721599419911702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,5120,0.015824000040690102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,3584,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,2048,0.010319999853769938
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,2560,0.01120746632417043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,3072,0.011945600310961407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,1536,0.009476266304651896
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,256,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,16384,0.03645439942677815
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,8192,0.02177600065867106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,6144,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,7168,0.019594667355219524
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,4096,65536,0.12649813493092854
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,3584,0.013291733463605246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,4096,0.013979732990264893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,5120,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,2560,0.011217066645622253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,768,0.008243200182914735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,512,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,256,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,12288,0.028331732749938963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3584,65536,0.12547413508097333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,10240,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,8192,0.021415466070175172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,5120,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,6144,0.017666133244832356
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,4096,0.01397119959195455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,3072,0.012000000476837159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,2560,0.011318399508794149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,2048,0.010718933741251628
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,512,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,256,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,16384,0.03604373137156169
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,10240,0.02525866627693176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,8192,0.021346133947372437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,3072,65536,0.12581546306610109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,7168,0.019707733392715455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,6144,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,5120,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,4096,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,3584,0.01318826675415039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,3072,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,2048,0.010388267040252686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,10240,0.024984532594680788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2560,65536,0.12485973040262859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,7168,0.019502933820088705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,5120,0.015689599514007568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,4096,0.01407360037167867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,2048,0.010309333602587383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,1024,0.008989866574605305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,128,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,12288,0.02805759906768799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,10240,0.024643200635910033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,2048,65536,0.12462080319722493
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,6144,0.017729065815607705
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,3584,0.01318826675415039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,4096,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,3072,0.011991467078526814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,512,0.00782719999551773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,128,0.007180800040562947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1536,65536,0.12369919617970784
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,10240,0.0246453324953715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,7168,0.019170133272806804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,5120,0.016160000363985697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,3072,0.012469333410263062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,4096,0.013702399532000222
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,1536,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,2560,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,2048,0.010294399658838908
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,1024,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,256,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,1024,65536,0.12031893730163574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,12288,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,16384,0.03563520113627116
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,8192,0.020873600244522096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,7168,0.019367466370264687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,6144,0.01765973369280497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,5120,0.016029866536458333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,4096,0.01404159963130951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,3584,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,3072,0.01193386713663737
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,2048,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,768,0.008236800134181977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,1536,0.009603200356165568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,512,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,128,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,256,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,768,65536,0.1206933339436849
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,7168,0.019367466370264687
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,6144,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,5120,0.015620266397794088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,3584,0.012854400277137756
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,2560,0.01111253301302592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,2048,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,65536,0.11970559755961101
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,768,0.008215466638406117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,512,128,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,12288,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,16384,0.035633067289988204
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,6144,0.018071466684341432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,7168,0.018895999590555827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,5120,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,3584,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,65536,0.11926186879475911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,3072,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,2560,0.011573333541552227
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,2048,0.010055466492970785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,256,0.007396266857783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,256,128,0.007008000214894612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,12288,0.027853866418202717
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,65536,0.1203541358311971
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,7168,0.01930026610692342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,6144,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,5120,0.016084266702334087
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,4096,0.013570132851600646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,3584,0.01288106640179952
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,3072,0.011935999989509583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,2560,0.011585066715876263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,1536,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,768,0.008615466952323913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,512,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,256,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,1024,0.008243200182914735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,32,128,128,0.007111466427644093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,8192,0.07041707038879394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,10240,0.07970026334126791
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,12288,0.09058880011240641
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,7168,0.059903999169667564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,6144,0.052190931638081875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,16384,0.13165226777394612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,5120,0.0464906652768453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,4096,0.03781973520914714
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,3584,0.03256319959958394
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,2560,0.026624000072479247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,3072,0.030584534009297688
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,768,0.01432213286558787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,1024,0.01602133313814799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,2048,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,1536,0.019373865922292073
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,128,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,256,0.009944533308347065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,65536,512,0.011934933066368104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,10240,0.029080533981323244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,12288,0.03331413269042969
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,16384,0.04164160092671712
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,8192,0.024642133712768556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,7168,0.02211839954058329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,6144,0.020139733950297035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,4096,0.016088533401489257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,5120,0.01821546753247579
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,3072,0.014108799894650779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,3584,0.015205333630243937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,2560,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,1024,0.009066667159398396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,1536,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,2048,0.011618133385976155
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,768,0.008312533299128216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,256,0.007490133245786031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,12288,0.031129600604375203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,16384,0.03911679983139038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,10240,0.027170133590698243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,7168,0.021618133783340453
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,6144,0.019230933984120686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,4096,0.015406933426856995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,5120,0.017866667111714682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,3072,0.013563733299573263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,3584,0.014383999506632486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,2560,0.012061867117881774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,1024,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,1536,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,512,0.007964799801508587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,256,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,16384,0.03795839945475261
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,16384,65536,0.15981225967407225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,12288,65536,0.13052480220794677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,7168,0.02094506621360779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,6144,0.019230933984120686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,5120,0.017271467049916587
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,3072,0.012821333607037863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,3584,0.014006400108337402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,4096,0.015244799852371215
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,2048,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,2560,0.011557333668073018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,768,0.008302933474381765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,256,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,128,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,12288,0.029421865940093994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,16384,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,10240,65536,0.12823893229166666
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,6144,0.01916159987449646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,5120,0.01725013256072998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,3072,0.012410666545232136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,3584,0.013243732849756875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,4096,0.014860799908638
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,1536,0.00974079966545105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,2048,0.010423466563224792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,2560,0.011524266997973124
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,1024,0.00871573289235433
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,256,0.007521066566308339
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,8192,0.022457599639892578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,6144,0.018895999590555827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,5120,0.016657066345214844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,4096,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,3072,0.012342400352160136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,2048,0.01042133371035258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,1536,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,256,0.0074869334697723385
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,8192,65536,0.12602026462554933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,12288,0.029150933027267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,10240,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,7168,0.020537600914637247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,6144,0.01848640044530233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,7168,65536,0.12670293649037678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,4096,0.014393599828084311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,5120,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,3584,0.013290666540463767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,3072,0.012411733468373615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,2560,0.011215999722480774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,2048,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,12288,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,10240,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,8192,0.022167466084162393
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,7168,0.020278400182723998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,6144,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,5120,0.01637226641178131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,6144,65536,0.1257130702336629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,3072,0.011963733037312825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,2560,0.01120853324731191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,2048,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,1024,0.008718933661778767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,512,0.00780266672372818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,12288,0.029013333717981975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,16384,0.03638613224029541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,10240,0.025462400913238526
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,8192,0.02177813251813253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,7168,0.020275199413299562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,6144,0.017934934298197428
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,5120,65536,0.1271125316619873
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,5120,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,2560,0.011515733599662781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,128,0.0074527998765309645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,256,0.007294933497905731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,12288,0.02887786626815796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,65536,0.12540586789449054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,6144,0.017669334014256795
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,5120,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,4096,0.013979732990264893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,3072,0.012378666798273723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,2048,0.010307199756304423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,2560,0.011180800199508668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,65536,0.1262933333714803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,256,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3584,128,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,12288,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,8192,0.02109439969062805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,6144,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,4096,0.014016000429789224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,5120,0.015825066963831583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,3072,0.01200213332970937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,3584,0.012820266683896384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,2560,0.011126400033632914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,512,0.00787199983994166
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,128,0.007054933408896129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,3072,65536,0.12595093250274658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,10240,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,12288,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,7168,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,6144,0.018090667327245076
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,5120,0.016028799613316855
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,4096,3072,0.0123690664768219
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,3584,0.01316159963607788
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,3072,0.011994666854540507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,2560,0.011538133025169373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,768,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,512,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,256,0.007522133489449819
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,128,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2560,65536,0.12499626477559407
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,16384,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,10240,0.02471359968185425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,7168,0.01957226594289144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,6144,0.017668267091115318
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,4096,0.014109866817792258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,3072,0.012026666601498922
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,3584,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,2048,0.010762666662534077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,12288,0.028537599245707194
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,16384,0.035358933607737224
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,6144,0.017731199661890663
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,4096,0.01399786671002706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,5120,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,2048,65536,0.1237674633661906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,3584,0.01318826675415039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,2560,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,2048,0.010424533486366272
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,512,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,256,0.00739519993464152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1536,65536,0.1232917308807373
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,16384,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,8192,0.02094506621360779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,7168,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,5120,0.015620266397794088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,6144,0.017656532923380534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,4096,0.013639466961224875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,3072,0.012027733524640401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,2560,0.011150933305422465
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,2048,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,1024,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,512,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,256,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,128,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,1024,65536,0.1213098684946696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,16384,0.034883201122283936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,8192,0.02095680038134257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,7168,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,6144,0.017730132738749186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,5120,0.01602133313814799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,4096,0.013585066795349121
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,3584,0.01325440009435018
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,3072,0.012029866377512615
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,2560,0.01111466685930888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,768,0.00864533285299937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,1024,0.008249600231647492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,65536,0.11984000205993653
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,128,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,768,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,6144,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,5120,0.015681067109107973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,3584,0.012822399536768595
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,2560,0.01120746632417043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,3072,0.0123989333709081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,2048,0.009900800387064616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,1024,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,768,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,65536,0.11933120091756184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,512,0.00782719999551773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,512,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,7168,0.019298134247461955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,6144,0.01766293247540792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,65536,0.11909333070119221
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,5120,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,4096,0.013639466961224875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,3584,0.013153066237767538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,2560,0.011516799529393513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,2048,0.009954133629798889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,1024,0.008313600222269695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,512,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,128,0.00721919983625412
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,16384,0.034883201122283936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,65536,0.1189237356185913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,7168,0.019299199183781944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,6144,0.017612799008687337
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,5120,0.015681067109107973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,4096,0.013674666484196981
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,3584,0.012847999731699625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,2560,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,3072,0.011935999989509583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,2048,0.010286933183670044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,128,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,128,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,16,256,8192,0.021348265806833903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,12288,0.09564159711201986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,8192,0.07000746726989746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,10240,0.0818176031112671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,16384,0.11912533442179363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,7168,0.059835731983184814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,6144,0.055912534395853676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,5120,0.046830932299296066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,4096,0.03816106716791789
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,3072,0.03174399932225545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,2560,0.02764799992243449
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,3584,0.033655468622843424
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,2048,0.023483733336130776
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,512,0.011617066462834676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,768,0.014425599575042724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,256,0.009945600231488546
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,128,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,1024,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,65536,1536,0.02018346587816874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,10240,0.029080533981323244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,12288,0.03379199902216594
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,16384,0.046353065967559816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,8192,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,6144,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,5120,0.01848213275273641
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,4096,0.016235733032226564
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,2560,0.012957866986592612
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,3584,0.015825066963831583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,3072,0.014108799894650779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,1024,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,1536,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,2048,0.011285332838694255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,512,0.007906133433183034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,256,0.007394133508205414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,128,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,12288,0.031197865804036457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,16384,0.03863893349965413
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,10240,0.026895999908447266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,8192,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,7168,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,6144,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,4096,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,5120,0.017796266078948974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,3072,0.013292800386746725
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,3584,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,2048,0.010397866368293762
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,2560,0.012027733524640401
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,1024,0.009054932991663616
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,768,0.008516266942024231
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,128,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,16384,0.03809386491775513
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,16384,65536,0.14759252866109213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,10240,0.026077866554260254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,12288,65536,0.13052586714426678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,5120,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,7168,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,6144,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,3072,0.013597866892814637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,3584,0.01397333343823751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,4096,0.015001599987347921
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,2048,0.010423466563224792
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,2560,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,256,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,16384,0.03741013209025065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,10240,0.025873066981633504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,10240,65536,0.12683946291605633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,6144,0.018894932667414346
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,5120,0.017593600352605186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,7168,0.020807466904322305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,3072,0.012379733721415202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,3584,0.014074666301409402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,4096,0.014393599828084311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,2048,0.010763733585675558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,256,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,128,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,12288,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,16384,0.0373418649037679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,10240,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,8192,0.022574933369954427
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,7168,0.020547199249267577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,6144,0.019093332688013713
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,4096,0.014791466792424521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,5120,0.016850133736928306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,3584,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,3072,0.01200213332970937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,2560,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,1024,0.009030399719874065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,768,0.008472533027331034
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,8192,65536,0.12574613094329834
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,128,0.007114666700363159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,12288,0.029148799180984498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,10240,0.02553173303604126
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,7168,0.020411733786265054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,6144,0.01895786722501119
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,7168,65536,0.12602026462554933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,5120,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,4096,0.014382933576901754
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,1536,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,10240,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,8192,0.02211839954058329
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,7168,0.020665599902470907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,6144,0.018145066499710084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,4096,0.013979732990264893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,5120,0.01684053341547648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,3584,0.012823466459910074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,3072,0.012437333663304646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,6144,65536,0.12540586789449054
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,2048,0.01069546639919281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,2560,0.011215999722480774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,128,0.007454933226108551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,12288,0.029079467058181763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,16384,0.03652266661326091
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,8192,0.02198293407758077
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,7168,0.019853866100311278
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,6144,0.0181386669476827
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,5120,65536,0.12526933352152508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,4096,0.014042666554450989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,3584,0.01318826675415039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,5120,0.016032000382741295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,2560,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,3072,0.012436266740163167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,128,0.007180800040562947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,256,0.007086933155854543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,7168,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,6144,0.017798399925231932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,4096,65536,0.12506453196207684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,3584,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,4096,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,5120,0.015896532932917276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,2560,0.01120746632417043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,768,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,128,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3584,65536,0.12636160055796306
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,10240,0.02532586654027303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,8192,0.021435733636220297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,5120,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,7168,0.019797333081563315
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,6144,0.017467733224232992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,3584,0.01325866679350535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,4096,0.013982933759689332
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,2560,0.011617066462834676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,2048,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,768,0.00844266712665558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,128,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,256,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,8192,0.021415466070175172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,3072,65536,0.12506346702575682
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,7168,0.019308799505233766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,6144,0.018071466684341432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,5120,0.01568000018596649
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,3072,0.011989333232243856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,2560,0.011217066645622253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,768,0.008308266599973042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,256,0.0075573335091273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,12288,0.027990400791168213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,16384,0.03590826590855916
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2560,65536,0.12482666969299316
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,7168,0.01890773375829061
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,6144,0.017730132738749186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,2560,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,768,0.008648533622423809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,1024,0.00865600009759267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,256,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,10240,0.024576000372568765
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,2048,65536,0.12387093702952068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,7168,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,6144,0.017730132738749186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,5120,0.015682133038838704
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,4096,0.013573333621025085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,2560,0.011582932869593303
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,2048,0.01033066709836324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,3072,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,1536,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,128,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,256,0.007427200178305308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,12288,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,16384,0.0357045332590739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1536,65536,0.12212906678517658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,7168,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,5120,0.016090666254361473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,4096,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,3072,0.012436266740163167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,3584,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,2048,0.010553600390752156
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,1536,0.009099733829498292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,2560,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,768,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,512,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,256,0.0074890668193499255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,1024,65536,0.12004693349202473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,12288,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,16384,0.035361067454020186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,8192,0.020549333095550536
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,7168,0.019364267587661743
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,6144,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,5120,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,4096,0.014108799894650779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,3584,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,3072,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,1536,0.009533866246541341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,1024,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,256,0.007017600039641063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,128,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,768,65536,0.11967146396636963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,8192,0.02095680038134257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,7168,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,6144,0.017258665959040322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,5120,0.015677866339683533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,4096,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,3584,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,3072,0.012060800194740295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,2560,0.010811733206113179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,2048,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,65536,0.1210367997487386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,768,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,256,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,512,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,12288,0.027852799495061236
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,10240,0.025054933627446492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,16384,0.034883201122283936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,6144,0.017321600516637167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,7168,0.019708800315856933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,4096,0.014409599701563516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,5120,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,3584,0.012753066420555115
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,65536,0.11919253667195637
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,2560,0.01120746632417043
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,1536,0.009475200374921163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,768,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,512,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,256,0.0071050668756167095
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,256,128,0.007114666700363159
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,16384,0.03447573184967041
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,65536,0.12032000223795573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,7168,0.01930026610692342
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,5120,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,6144,0.017258665959040322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,4096,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,3584,0.012813867131868998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,3072,0.012404266993204753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,2560,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,768,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,256,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,512,0.007494399944941203
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,8,128,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,8192,0.07321600119272867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,10240,0.07942933241526286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,12288,0.0934229294459025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,7168,0.06441173156102499
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,6144,0.05321493148803711
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,16384,0.12438186804453533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,5120,0.04526079893112182
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,4096,0.040278398990631105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,3584,0.03536213239034017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,2560,0.026009599367777508
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,3072,0.03242666721343994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,1024,0.016498133540153503
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,2048,0.024985599517822265
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,768,0.014803199966748556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,128,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,1536,0.019718400637308755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,256,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,65536,512,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,10240,0.03031040032704671
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,12288,0.03345066706339518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,16384,0.04990293184916179
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,8192,0.025804799795150758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,7168,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,6144,0.022177066405614218
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,5120,0.018478933970133463
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,4096,0.01625920037428538
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,2560,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,3584,0.01644266645113627
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,3072,0.014043733477592468
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,1024,0.009061333537101746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,1536,0.010732799768447876
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,2048,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,768,0.008377599716186523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,256,0.007626666625340779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,128,0.007012266914049785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,512,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,16384,0.038571735223134354
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,8192,0.022937599817911783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,7168,0.020946133136749267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,6144,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,4096,0.015340800086657206
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,5120,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,3072,0.013296000162760415
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,3584,0.014453333616256715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,2048,0.010357333223025005
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,2560,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,1024,0.008691199620564779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,1536,0.009603200356165568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,512,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,16384,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,16384,65536,0.14895787239074706
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,12288,0.02996693253517151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,12288,65536,0.12998080253601074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,5120,0.01766080061594645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,7168,0.020889600118001304
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,6144,0.019032533963521323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,3072,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,3584,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,4096,0.015370666980743408
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,1536,0.009533866246541341
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,2560,0.011558399597803751
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,256,0.007485866546630859
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,16384,0.03775146802266439
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,10240,0.02600853244463603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,10240,65536,0.12690773010253906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,8192,0.022801067431767783
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,6144,0.01889066696166992
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,5120,0.017249067624409996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,3072,0.012807466586430869
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,3584,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,4096,0.014453333616256715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,1536,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,2048,0.01032319962978363
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,2560,0.01165226697921753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,512,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,256,0.007418666779994964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,12288,0.02955946723620097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,16384,0.03659093379974365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,10240,0.026667733987172444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,8192,0.022323199113210044
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,7168,0.021005866924921672
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,6144,0.01854613423347473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,5120,0.017249067624409996
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,4096,0.014381866653760275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,3072,0.01202880044778188
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,3584,0.01363200048605601
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,2048,0.01072746713956197
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,2560,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,1024,0.00864746669928233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,1536,0.009877333045005798
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,8192,65536,0.12588373025258381
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,10240,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,7168,0.020125865936279297
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,6144,0.019026132424672444
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,7168,65536,0.1261567989985148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,4096,0.01455466647942861
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,5120,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,3584,0.013195733229319254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,3072,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,2560,0.011127466956774395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,2048,0.01032960017522176
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,256,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,128,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,16384,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,65536,0.12581546306610109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,10240,0.02573653260866801
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,7168,0.019990400473276774
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,8192,0.022025599082310995
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,5120,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,6144,0.018284799655278523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,4096,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,3584,0.012819199760754903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,3072,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,2560,0.01111466685930888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,2048,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,768,0.008242133259773254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,256,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,128,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,5120,65536,0.12506453196207684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,6144,0.017667200167973837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,6144,768,0.008410666386286418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,5120,0.01602453291416168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,4096,0.013844266533851624
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,3584,0.013255467017491659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,3072,0.01209493378798167
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,2560,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,1536,0.009538132945696514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,2048,0.01076479951540629
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,128,0.007112533350785573
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,16384,0.03611413240432739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,10240,0.02539413372675578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,8192,0.021434666713078816
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,4096,65536,0.1261567989985148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,7168,0.020119466384251914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,5120,0.015890133380889893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,6144,0.017667200167973837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,3584,0.012820266683896384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,4096,0.014074666301409402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,3072,0.011934933066368104
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,2048,0.010492799679438274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,2560,0.011148800452550251
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,1024,0.00878613293170929
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,768,0.007977599898974102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,256,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,12288,0.028808534145355225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,16384,0.03618133465449015
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3584,65536,0.1249621311823527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,8192,0.021708800395329794
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,6144,0.01765973369280497
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,5120,0.016090666254361473
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,3584,0.013222400347391763
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,4096,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,768,0.008682666222254436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,128,0.007046400010585785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,256,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,16384,0.0362496018409729
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,65536,0.12506453196207684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,8192,0.021346133947372437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,7168,0.019368533293406168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,5120,0.016125866770744325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,3584,0.013221333424250284
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,3072,0.011969066659609477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,2560,0.011334400375684102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,512,0.0074314668774604796
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,128,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2560,65536,0.12451840241750081
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,12288,0.02826133370399475
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,16384,0.03542933464050293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,8192,0.020946133136749267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,6144,0.01726186672846476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,5120,0.01602453291416168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,4096,0.013636266191800436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,3584,0.013050666451454163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,2560,0.011106133460998535
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,1024,0.008319999774297078
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,768,0.008242133259773254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,512,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,256,0.007421866556008657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,128,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,16384,0.035293865203857425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,2048,65536,0.12154666582743327
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,10240,0.024710400899251302
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,8192,0.02136639952659607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,7168,0.018899200359980266
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,6144,0.01772586703300476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,2560,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,2048,0.010494933525721232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,1536,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,65536,0.12134400208791096
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,1024,0.00885653297106425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,768,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,512,0.007864533364772797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1536,128,0.006986666719118755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,8192,0.020606933037439983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,10240,0.02505279978116353
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,6144,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,7168,0.018898133436838785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,5120,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,4096,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,3584,0.013220266501108805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,2048,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,65536,0.12014933427174886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,1536,0.009467732906341553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,1024,0.008281599978605907
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,512,0.007898666461308797
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,128,0.007079466680685679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,256,0.007155199845631917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,12288,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,3072,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,65536,0.12137813568115234
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,6144,0.017832533518473307
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,5120,0.01565333306789398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,3584,0.012776533762613932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,3072,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,2560,0.010795733332633973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,2048,0.010494933525721232
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,768,0.007850666840871174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,512,0.007999999821186066
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,256,0.007085866729418437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,16384,0.03536213239034017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,10240,0.024711465835571288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,8192,0.021347200870513915
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,65536,0.11933013598124187
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,7168,0.019708800315856933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,4096,0.013595733046531677
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,3584,0.013288533687591553
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,3072,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,2560,0.011492266257603963
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,2048,0.010297600428263347
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,768,0.00830506682395935
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,1024,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,512,0.007895466685295106
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,512,128,0.007042133311430614
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,16384,0.03543039957682292
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,65536,0.11878399848937989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,10240,0.02471359968185425
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,8192,0.020536533991495767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,7168,0.019729065895080566
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,5120,0.016124799847602844
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,4096,0.014108799894650779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,3584,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,3072,0.012403200070063274
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,2560,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,2048,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,1536,0.00906773308912913
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,1024,0.009052800138791402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,512,0.007928533355395
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,768,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,256,128,0.006678399940331777
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,65536,0.12014933427174886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,8192,0.020947200059890748
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,7168,0.019708800315856933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,5120,0.016089600324630738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,6144,0.01732906699180603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,3584,0.01276693344116211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,3072,0.01269653340180715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,2560,0.010706133643786113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,1024,0.009059199690818786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,512,0.008102400104204814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,768,0.00790826678276062
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,256,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,128,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,1024,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,4,768,7168,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,8192,0.07178239822387696
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,12288,0.09164586861928305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,10240,0.07594453493754069
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,16384,0.1374890645345052
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,5120,0.04826346635818481
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,6144,0.04932159980138143
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,7168,0.060141865412394205
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,4096,0.04082346757253011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,2560,0.02867199977238973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,3072,0.031196800867716472
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,3584,0.035702399412790936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,1024,0.01623466710249583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,768,0.014407466848691305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,256,0.009946667154630025
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,1536,0.020821332931518555
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,512,0.011591466267903645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,128,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,65536,2048,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,10240,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,12288,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,16384,0.04802560011545817
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,8192,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,7168,0.023142399390538533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,6144,0.022652800877889
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,4096,0.016452266772588094
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,5120,0.018480000893274943
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,3072,0.014061866203943887
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,3584,0.01643946667512258
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,2560,0.013155200084050498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,1024,0.009126399954160053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,1536,0.010445866982142131
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,2048,0.011549866199493409
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,768,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,256,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,128,0.007249066730340321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,512,0.00790719985961914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,12288,0.03037866751352946
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,16384,0.03925333420435588
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,10240,0.026692267258961993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,8192,0.023415466149648033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,7168,0.020958934227625528
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,6144,0.019777067502339683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,5120,0.017602133750915527
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,4096,0.01564479966958364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,3072,0.013220266501108805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,3584,0.014425599575042724
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,2560,0.011971199512481689
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,1536,0.009947733084360758
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,512,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,128,0.007086933155854543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,16384,0.037956265608469646
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,16384,65536,0.14943572680155437
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,12288,0.029832533995310467
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,10240,0.026282666126887004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,12288,65536,0.13168853123982746
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,8192,0.022528000672658286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,5120,0.017391999562581383
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,7168,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,6144,0.01909546653429667
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,3584,0.014014933506647745
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,3072,0.012745599945386252
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,4096,0.014800000190734863
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,1536,0.009478400150934856
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,2048,0.010354133447011311
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,2560,0.011523200074831645
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,768,0.008309333523114523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,128,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,12288,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,16384,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,10240,0.02614506681760152
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,10240,65536,0.12745386759440105
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,5120,0.016979199647903443
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,6144,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,7168,0.02068586746851603
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,3072,0.012341333429018657
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,3584,0.013814399639765421
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,4096,0.014794666568438211
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,1536,0.009603200356165568
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,2048,0.010831999778747558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,2560,0.011181867122650147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,128,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,16384,0.03700053294499715
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,10240,0.025943466027577716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,7168,0.020874667167663574
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,6144,0.019299199183781944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,5120,0.016849066813786825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,4096,0.015067733327547708
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,3584,0.01316266655921936
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,3072,0.012467199563980102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,2048,0.01069546639919281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,2560,0.01121493379275004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,1024,0.008624000350634257
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,512,0.007931733131408691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,256,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,8192,65536,0.12581546306610109
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,12288,0.029150933027267456
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,16384,0.03659093379974365
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,10240,0.025600000222524004
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,8192,0.02218666672706604
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,7168,0.020127999782562255
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,6144,0.018488534291585288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,7168,65536,0.1257813294728597
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,4096,0.013980799913406372
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,5120,0.016438399751981102
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,3584,0.013152000308036805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,3072,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,2048,0.010388267040252686
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,256,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,512,0.007837866743405659
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,128,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,12288,0.02914773424466451
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,16384,0.036183468500773114
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,8192,0.021833600600560506
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,7168,0.020119466384251914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,6144,0.018076799313227334
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,6144,65536,0.1265664021174113
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,3072,0.012001066406567892
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,3584,0.013155200084050498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,2560,0.011583999792734782
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,2048,0.01029973328113556
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,768,0.008243200182914735
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,1024,0.008713600039482117
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,256,0.007456000149250031
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,128,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,12288,0.02921813329060872
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,16384,0.03611413240432739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,10240,0.025872000058492023
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,8192,0.02177706758181254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,7168,0.020116267601648967
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,6144,0.018068265914916993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,5120,65536,0.12567893664042157
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,4096,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,3584,0.013024000326792398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,5120,0.01609173317750295
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,2048,0.010692266623179118
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,2560,0.011126400033632914
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,3072,0.012025599678357441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,768,0.008236800134181977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,1024,0.008657067020734151
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,1536,0.009539199868837993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,128,0.007077333331108093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,12288,0.028945066531499225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,16384,0.036111998558044436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,7168,0.019717333714167277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,6144,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,4096,65536,0.12513173421223958
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,4096,0.01397119959195455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,5120,0.015622400244077048
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,3584,0.01285653313000997
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,2560,0.011146666606267293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,3072,0.011992533008257549
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,1536,0.00942080020904541
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,1024,0.008259200056393941
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,256,0.0072202667593956
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,128,0.006984533369541168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3584,65536,0.1263967990875244
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,8192,0.0212991992632548
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,7168,0.019707733392715455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,5120,0.015621333320935567
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,6144,0.017670400937398276
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,4096,0.014040533701578775
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,2048,0.01033066709836324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,1536,0.009477333227793375
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,2560,0.011548800269762675
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,256,0.007523199915885926
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,12288,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,8192,0.021367466449737547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,3072,65536,0.1252010663350423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,7168,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,6144,0.018067200978597008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,5120,0.01575146714846293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,4096,0.013777066270510355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,3584,0.01325653294722239
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,3072,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,2048,0.010717866818110149
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,512,0.007831466694672901
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,256,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,128,0.0070783997575442
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,65536,0.12322133382161457
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,12288,0.0279914657274882
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,6144,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,7168,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,5120,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,4096,0.013707733154296875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,3584,0.013187199831008911
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,3072,0.011940266688664753
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,2560,0.011241599917411804
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,2048,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,1024,0.0083146666487058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,512,0.007849599917729695
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,256,0.007483733197053273
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,128,0.006984533369541168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2048,65536,0.12397226492563884
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,16384,0.035292800267537436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,8192,0.02094506621360779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,7168,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,6144,0.017292799552281697
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,5120,0.015620266397794088
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,4096,0.013640532890955607
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,1536,0.009272533655166625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,1024,0.008246399958928426
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,768,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,512,0.007430399954319
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,256,0.007359999914964039
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,128,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1536,65536,0.12206079959869384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,10240,0.02430079976717631
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,8192,0.02053440014521281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,7168,0.019301333030064902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,6144,0.01726186672846476
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,5120,0.015681067109107973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,4096,0.01360426644484202
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,3584,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,3072,0.011967999736467998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,2560,0.01114026705423991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,2048,0.009886933366457622
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,65536,0.12014826933542888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,1024,0.008521599570910136
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,512,0.00782719999551773
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,768,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,128,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,1024,256,0.007054933408896129
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,12288,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,16384,0.03515733480453491
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,10240,0.024235733350118003
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,7168,0.019298134247461955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,6144,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,5120,0.015681067109107973
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,4096,0.013572266697883606
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,65536,0.1197386662165324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,3584,0.012970667084058127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,3072,0.01153600017229716
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,2048,0.010422399640083313
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,2560,0.011147733529408772
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,1536,0.009204266468683879
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,768,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,768,256,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,8192,0.02053546706835429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,7168,0.01890986760457357
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,6144,0.017259732882181803
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,4096,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,65536,0.11973973115285237
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,3584,0.012787200013796487
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,2560,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,3072,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,2048,0.009898666540781658
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,1024,0.008283733328183492
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,768,0.007835733393828075
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,512,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,512,128,0.0070165331164995836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,65536,0.11933120091756184
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,8192,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,7168,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,6144,0.01732053359349569
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,5120,0.015622400244077048
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,4096,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,3584,0.013154133160909017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,3072,0.011947733163833619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,2560,0.011146666606267293
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,2048,0.010288000106811523
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,1536,0.009134933352470398
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,256,0.007418666779994964
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,512,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,256,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,65536,0.11929600238800049
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,10240,0.024233599503835045
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,8192,0.02053546706835429
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,7168,0.019299199183781944
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,6144,0.017258665959040322
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,5120,0.015687466661135355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,4096,0.013972266515096029
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,3584,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,2560,0.011240532994270325
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,2048,0.009987200299898785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,1024,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,512,0.007495466868082683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,256,0.007113599777221679
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,128,0.006985599795977275
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,2560,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,2,128,3072,0.011935999989509583
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,10240,0.08266987005869547
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,12288,0.0935914675394694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,8192,0.06761813163757324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,16384,0.12199253241221111
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,7168,0.06427306731541951
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,6144,0.055978667736053464
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,5120,0.04642133315404256
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,3584,0.03679573138554891
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,4096,0.039255468050638835
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,3072,0.03290453354517619
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,2560,0.027236266930898027
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,1024,0.016781866550445557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,768,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,1536,0.020343466599782308
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,128,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,256,0.009920000036557516
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,512,0.011898666620254517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,65536,2048,0.02471253275871277
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,10240,0.028602667649586994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,12288,0.034542934099833174
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,16384,0.048196268081665036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,8192,0.024098134040832518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,7168,0.02307413419087728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,6144,0.022106667359670006
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,4096,0.01644053359826406
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,5120,0.018481065829594932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,3584,0.016301866372426352
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,3072,0.014391466975212097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,2560,0.012983466188112894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,1024,0.009127466877301534
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,2048,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,1536,0.009918933113416035
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,768,0.008694400389989216
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,256,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,512,0.007840000092983246
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,12288,0.030377600590387983
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,16384,0.038365864753723146
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,10240,0.026760532458623247
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,8192,0.023005867004394533
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,7168,0.021348265806833903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,6144,0.0193066676457723
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,5120,0.017933867375055947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,4096,0.015211733182271323
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,3072,0.013175466656684875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,3584,0.014791466792424521
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,2048,0.011105066537857056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,2560,0.011878400047620138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,1536,0.009876267115275065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,512,0.007891199986139933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,768,0.008250666658083598
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,256,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,128,0.007052800059318543
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,16384,0.0375488003094991
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,16384,65536,0.1482752005259196
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,12288,0.029766400655110676
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,10240,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,12288,65536,0.13134506543477376
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,7168,0.02068480054537455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,5120,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,6144,0.01904639999071757
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,3584,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,3072,0.01275200049082438
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,4096,0.015201066931088766
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,1536,0.009537067015965779
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,2560,0.011623467008272808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,768,0.008248533308506011
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,256,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,12288,0.029627732435862225
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,10240,0.025941334168116253
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,10240,65536,0.12752319971720377
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,7168,0.020616533358891805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,5120,0.017116800944010416
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,6144,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,3072,0.012779733538627625
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,3584,0.013393066326777139
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,4096,0.014459733168284097
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,2048,0.010307199756304423
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,2560,0.011550933122634888
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,768,0.008247466882069905
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,1024,0.008678399523099263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,128,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,10240,0.025601067145665485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,7168,0.02054826617240906
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,6144,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,5120,0.016436266899108886
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,4096,0.014858667055765787
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,3584,0.013196800152460733
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,3072,0.012354133526484172
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,2048,0.010834133625030518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,2560,0.011181867122650147
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,1536,0.009539199868837993
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,1024,0.00865600009759267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,768,0.00837546686331431
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,128,0.0072053333123524976
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,8192,65536,0.12560959657033283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,16384,0.0369322657585144
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,10240,0.0258026659488678
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,8192,0.02259626587231954
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,6144,0.018820265928904213
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,7168,0.020138667027155558
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,7168,65536,0.1254752000172933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,4096,0.014046933253606161
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,5120,0.016839466492335
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,3584,0.013152000308036805
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,3072,0.012288000186284382
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,2560,0.011562666296958924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,2048,0.010389332969983418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,1024,0.008716799815495809
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,768,0.008242133259773254
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,256,0.007020799815654755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,128,0.007011199990908305
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,12288,0.029149866104125975
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,16384,0.03611413240432739
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,10240,0.025463465849558515
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,8192,0.021356799205144248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,7168,0.019933867454528808
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,6144,0.01801066597302755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,5120,0.01602133313814799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,6144,65536,0.12602026462554933
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,3584,0.013156267007191977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,2560,0.011115733782450359
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,2048,0.010296533505121868
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,512,0.007838933169841767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,128,0.007075199981530507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,256,0.00729066679875056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,12288,0.028739200035731
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,16384,0.03624746799468994
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,10240,0.02532800038655599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,8192,0.02136853337287903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,7168,0.019718400637308755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,6144,0.0178656001885732
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,5120,65536,0.1268053372701009
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,4096,0.013974400361378989
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,3584,0.013223466277122498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,5120,0.016030933459599814
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,2560,0.011515733599662781
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,3072,0.011994666854540507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,768,0.008238933483759562
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,1024,0.008717866738637288
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,1536,0.009489066402117411
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,128,0.0070165331164995836
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,256,0.0074879998962084455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,12288,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,16384,0.03658986488978068
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,8192,0.021824000279108684
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,7168,0.019504000743230186
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,6144,0.01813653310139974
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,4096,65536,0.1249951998392741
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,4096,0.014017066359519959
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,5120,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,3584,0.012786133090655008
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,2560,0.011242666840553283
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,2048,0.010295466581980387
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,3072,0.012429866194725036
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,768,0.008306133250395458
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,1536,0.009468799829483033
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,1024,0.008659199873606364
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,512,0.007828266421953837
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,256,0.007386666536331177
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,128,0.006986666719118755
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,12288,0.02874133388201396
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,16384,0.0361130674680074
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3584,65536,0.12547413508097333
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,10240,0.02539413372675578
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,8192,0.02134079933166504
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,5120,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,6144,0.01732800006866455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,3584,0.012811733285586038
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,3072,0.01193173329035441
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,4096,0.013981866836547851
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,1536,0.009475200374921163
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,2560,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,2048,0.010328533252080281
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,512,0.007428266604741414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,128,0.007076266904671986
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,256,0.007088000078996022
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,12288,0.02874026695887248
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,16384,0.036111998558044436
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,10240,0.024778666098912557
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,3072,65536,0.12673707008361818
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,7168,0.019319466749827065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,6144,0.017661867539087932
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,5120,0.016023466984430947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,3584,0.012880000472068786
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,4096,0.013573333621025085
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,3072,0.012356266379356384
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,2048,0.010301867127418518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,2560,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,768,0.008274133503437042
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,1024,0.008658132950464885
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,512,0.007896533111731212
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,256,0.007420800129572551
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,128,0.007018666466077168
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,12288,0.027784534295399982
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2560,65536,0.1240063985188802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,7168,0.01925119956334432
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,6144,0.017681066195170084
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,5120,0.015619200468063355
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,3584,0.012813867131868998
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,3072,0.011969066659609477
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,4096,0.013571199774742127
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,2560,0.011174399654070537
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,2048,0.010308266679445902
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,1024,0.00865066647529602
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,768,0.00787306676308314
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,128,0.007009066641330719
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,16384,0.03536213239034017
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,65536,0.12301653226216633
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,8192,0.021348265806833903
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,10240,0.02474666635195414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,7168,0.019709867238998414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,6144,0.017273600896199545
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,4096,0.013630933562914529
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,5120,0.01602240006128947
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,3584,0.012844799955685934
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,3072,0.012402133146921793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,2048,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,2560,0.01120853324731191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,1536,0.0095360000928243
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,65536,0.1210367997487386
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,768,0.008241066833337148
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,512,0.007897600034872691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,256,0.007051733136177063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1536,128,0.00697386662165324
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,10240,0.024369066953659056
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,7168,0.019285333156585694
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,6144,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,5120,0.015613866845766702
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,4096,0.013607466220855713
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,3584,0.012812800208727517
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,3072,0.011966933806737263
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,2560,0.011175466577212016
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,2048,0.009967999656995137
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,1536,0.009469866752624512
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,65536,0.12226560115814208
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,1024,0.0083146666487058
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,768,0.008239999910195668
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,512,0.007931733131408691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,128,0.007043200234572093
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,1024,256,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,12288,0.027511467536290485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,8192,0.020957867304484047
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,10240,0.024234666426976522
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,7168,0.019298134247461955
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,6144,0.01725546717643738
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,5120,0.015683199961980185
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,4096,0.01360640029112498
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,3584,0.012846933801968894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,65536,0.12144746780395507
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,3072,0.011741866668065388
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,2560,0.011173333724339802
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,2048,0.01069760024547577
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,1536,0.00913279950618744
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,1024,0.008649599552154542
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,256,0.007417599856853485
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,512,0.007429333527882893
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,768,128,0.007044266661008198
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,12288,0.028330665826797486
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,10240,0.02505386670430501
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,8192,0.020536533991495767
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,7168,0.01936639944712321
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,6144,0.017257599035898845
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,5120,0.01602026621500651
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,4096,0.013639466961224875
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,65536,0.11963733037312825
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,3584,0.013289599617322286
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,2560,0.01120853324731191
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,3072,0.011946666240692138
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,2048,0.010696533322334289
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,1536,0.00947093367576599
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,768,0.008307200173536937
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,1024,0.00831573357184728
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,256,0.007419733206431071
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,512,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,16384,0.03570346832275391
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,12288,0.027512532472610474
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,10240,0.024780799945195518
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,8192,0.020946133136749267
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,65536,0.11932799816131592
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,7168,0.019709867238998414
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,6144,0.01726079980532328
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,5120,0.01602133313814799
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,4096,0.014074666301409402
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,3072,0.011993599931399028
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,3584,0.01276586651802063
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,2560,0.01153706709543864
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,2048,0.010285866260528565
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,1024,0.009058133761088053
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,1536,0.009065600236256917
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,768,0.008236800134181977
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,512,0.007931733131408691
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,256,0.007031466563542683
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,256,128,0.007080533107121785
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,12288,0.02792106668154399
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,16384,0.034884266058603924
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,65536,0.11980693340301514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,10240,0.024644267559051514
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,8192,0.020947200059890748
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,7168,0.019707733392715455
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,6144,0.017318399747212727
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,4096,0.01407360037167867
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,5120,0.015618133544921874
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,3584,0.012846933801968894
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,3072,0.012333866953849793
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,2048,0.01035520037015279
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,2560,0.011116799712181092
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,1024,0.00864746669928233
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,1536,0.009876267115275065
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,768,0.00783679982026418
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,512,0.007830399771531422
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,256,0.0074538667996724445
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,128,128,0.007019733389218648
TRTLLM,1.0.0rc6,NVIDIA GB200,gemm,torch_flow,nvfp4,1,2048,1536,0.009477333227793375
