mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-19 12:30:16 +00:00
[CKTILE] FMHA fwd trload lse fix (#3046)
* enable storelse for fmha_fwd_trload kernel
* fix lse in trload
* fix the mask-related bug
[ROCm/composable_kernel commit: 0d3860dfdb]
This commit is contained in:
@@ -724,7 +724,6 @@ class KernelComponentFactory:
|
||||
and logits == "f"
|
||||
and bias == "no"
|
||||
and dropout == "f"
|
||||
and lse == "f"
|
||||
and skip == "f"
|
||||
):
|
||||
pipelines.append(FmhaFwdPipeline("qr_async_trload", "row", "f", "f", "f", "f", logits, bias, lse, dropout, squant, mask, skip, "t")) # fmt: skip
|
||||
|
||||
Reference in New Issue
Block a user