mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-07-01 04:07:56 +00:00
Remove the no-LSE restriction for group mode hd192 (#2252)
Co-authored-by: Jim <jimguo12@amd.com>
This commit is contained in:
@@ -517,7 +517,7 @@ def get_fwd_blobs(kernel_filter : Optional[str], receipt, optdim_list, mask_impl
|
|||||||
continue
|
continue
|
||||||
if hdim == 192 and tile.F_bn1 == 128:
|
if hdim == 192 and tile.F_bn1 == 128:
|
||||||
# NOTE: this is used to speedup deepseek prefill case, we don't gen training
|
# NOTE: this is used to speedup deepseek prefill case, we don't gen training
|
||||||
if pipeline.F_bias != 'no' or pipeline.F_lse == 't' or pipeline.F_dropout == 't':
|
if pipeline.F_bias != 'no' or pipeline.F_dropout == 't':
|
||||||
continue
|
continue
|
||||||
# logits_soft_cap is only allowed if no bias
|
# logits_soft_cap is only allowed if no bias
|
||||||
if not ((pipeline.F_logits == 't' and pipeline.F_bias == 'no') or pipeline.F_logits == 'f'):
|
if not ((pipeline.F_logits == 't' and pipeline.F_bias == 'no') or pipeline.F_logits == 'f'):
|
||||||
|
|||||||
Reference in New Issue
Block a user