Merge commit 'c0c2ded56684a3a04ad9df1b907d27ae7635067d' into develop

This commit is contained in:
assistant-librarian[bot]
2025-08-12 11:11:28 +00:00
parent d869fdb172
commit 5e9cfbe15c

4
example/ck_tile/01_fmha/fmha_fwd.cpp Executable file → Normal file
View File

@@ -525,8 +525,8 @@ bool run(const ck_tile::ArgParser& arg_parser)
flop += nhead * (static_cast<std::size_t>(2) * mask.get_unmaskarea() * hdim_q +
static_cast<std::size_t>(2) * mask.get_unmaskarea() * hdim_v);
-num_byte += nhead * (sizeof(QDataType) * real_seqlen_q * hdim_q +
-sizeof(ODataType) * real_seqlen_q * hdim_v);
+num_byte += nhead * (sizeof(QDataType) * real_seqlen_q * hdim_q +
+sizeof(ODataType) * real_seqlen_q * hdim_v);
num_byte += nhead_k * (sizeof(KDataType) * real_seqlen_k * hdim_q +
sizeof(VDataType) * hdim_v * real_seqlen_k);
}