Load Q through LDS and implement XOR

This commit is contained in:
aska-0096
2025-08-04 06:49:01 +00:00
parent 2d4e73d2b4
commit 746f4ccb99
4 changed files with 99 additions and 24 deletions

View File

@@ -42,6 +42,7 @@ SEQLENQ_MAP = {
# "32" : "32",
# "64" : "64"
"128" : "128",
# "256" : "256",
}
FMHA_FWD_DECODE_PIPELINE_MAP = {
@@ -668,6 +669,7 @@ def get_fmha_fwd_tile_dict_from_dtype(dtype : str) -> Optional[dict]:
# '16': FmhaFwdTileSize(16, 32, 64, 128, 32, 128, 1, 1, 1, 1, 1, 1, 16, 16, 32, 16, 16, 32, -1),
# '32': FmhaFwdTileSize(32, 32, 128, 128, 32, 128, 1, 1, 1, 1, 1, 1, 32, 32, 16, 32, 32, 16, -1),
'128': FmhaFwdTileSize(128, 64, 32, 128, 16, 128, 4, 1, 1, 4, 1, 1, 32, 32, 16, 32, 32, 16, -1),
# '256': FmhaFwdTileSize(256, 64, 32, 128, 16, 128, 8, 1, 1, 8, 1, 1, 32, 32, 16, 32, 32, 16, -1),
},
}
else: