From 644c6e520f08f70088f24b609b45c13124ad439f Mon Sep 17 00:00:00 2001 From: Linjun-AMD Date: Tue, 16 Dec 2025 06:18:38 -0600 Subject: [PATCH] fix sink error for asm fmha Signed-off-by: Linjun-AMD --- csrc/py_itfs_cu/asm_mha_fwd.cu | 1 + csrc/py_itfs_cu/asm_mha_varlen_fwd.cu | 1 + 2 files changed, 2 insertions(+) diff --git a/csrc/py_itfs_cu/asm_mha_fwd.cu b/csrc/py_itfs_cu/asm_mha_fwd.cu index d4c901fd2a..2efc1d7828 100644 --- a/csrc/py_itfs_cu/asm_mha_fwd.cu +++ b/csrc/py_itfs_cu/asm_mha_fwd.cu @@ -321,6 +321,7 @@ std::vector fmha_v3_fwd(at::Tensor &q, // [b, sq, hq, d] has_lse, quant_scale_enum::no_scale, true, + false, how_v3_bf16_cvt); TORCH_CHECK(t >= 0, "invalid argument for fmha_fwd"); } diff --git a/csrc/py_itfs_cu/asm_mha_varlen_fwd.cu b/csrc/py_itfs_cu/asm_mha_varlen_fwd.cu index 0189bd267c..6d2e9b8b19 100644 --- a/csrc/py_itfs_cu/asm_mha_varlen_fwd.cu +++ b/csrc/py_itfs_cu/asm_mha_varlen_fwd.cu @@ -399,6 +399,7 @@ fmha_v3_varlen_fwd(at::Tensor &q, // [total_q, hq, d] has_lse, quant_scale_enum::no_scale, true, + false, how_v3_bf16_cvt); TORCH_CHECK(t >= 0, "invalid argument for fmha_v3_varlen_fwd 3"); }