diff --git a/aiter/configs/a4w4_blockscale_tuned_gemm.csv b/aiter/configs/a4w4_blockscale_tuned_gemm.csv index 51a05157f0..3988c91f18 100644 --- a/aiter/configs/a4w4_blockscale_tuned_gemm.csv +++ b/aiter/configs/a4w4_blockscale_tuned_gemm.csv @@ -921,3 +921,5 @@ cu_num,M,N,K,kernelId,splitK,us,kernelName,tflops,bw,errRatio 256,8,3072,1536,42,0,5.4682,_ZN5aiter42f4gemm_bf16_per1x32Fp4_BpreShuffle_128x128E,13.81,441.57,0.0 256,8,7168,2048,29,0,5.836,_ZN5aiter41f4gemm_bf16_per1x32Fp4_BpreShuffle_64x128E,40.25,1278.77,0.0 256,8,512,7168,29,0,9.6677,_ZN5aiter41f4gemm_bf16_per1x32Fp4_BpreShuffle_64x128E,6.07,193.62,0.0 +256,32768,2112,7168,48,0,293.0219,_ZN5aiter42f4gemm_bf16_per1x32Fp4_BpreShuffle_160x384E,3385.88,898.98,0.0 +256,65536,2112,7168,48,0,575.6528,_ZN5aiter42f4gemm_bf16_per1x32Fp4_BpreShuffle_160x384E,3447.0,902.06,0.0 diff --git a/aiter/configs/a4w4_blockscale_untuned_gemm.csv b/aiter/configs/a4w4_blockscale_untuned_gemm.csv index 3c91c37b07..e78f1eb3f5 100644 --- a/aiter/configs/a4w4_blockscale_untuned_gemm.csv +++ b/aiter/configs/a4w4_blockscale_untuned_gemm.csv @@ -193,3 +193,5 @@ M,N,K 3000, 7168, 2048 3000, 512, 7168 60000, 4096, 512 +32768, 2112, 7168 +65536, 2112, 7168