mirror of
https://github.com/NVIDIA/cutlass.git
synced 2026-04-19 22:38:56 +00:00
update 3.8 v2 (#2112)
* update 3.8 v2 * update 3.8 --------- Co-authored-by: yuzhai <yuzhai@nvidia.com>
This commit is contained in:
@@ -489,7 +489,7 @@ def get_valid_schedules(tile_description, cuda_version, is_aligned, data_types,
|
||||
if is_fp32 and (is_tn or is_nn) and (cta_n % cta_k != 0):
|
||||
return [], []
|
||||
|
||||
- grouped = gemm_kind == GemmKind.GroupedGemmUniversal3x
|
||||
+ grouped = is_grouped(gemm_kind)
|
||||
if grouped:
|
||||
# the following cases are unsupported by grouped GEMM
|
||||
if not is_aligned:
|
||||
|
||||
Reference in New Issue
Block a user