mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-20 06:49:15 +00:00
[CK_TILE] Add permuteN optimization to remove lds operation in c_shuffle (#2764)
* permuteN optimization to remove lds operation in c_shuffle
* add the change log

---------

Co-authored-by: ThomasNing <thomas.ning@amd.com>
This commit is contained in:
@@ -175,6 +175,9 @@ struct sequence
|
||||
return sequence<type::get(number<Ids>{})...>{};
|
||||
}
|
||||
|
||||
// Adds up every element of the pack "Is"; an empty pack yields 0.
CK_TILE_HOST_DEVICE static constexpr auto sum()
{
    // binary right fold over "+", seeded with 0 so the empty pack is well-formed
    constexpr auto total = (Is + ... + 0);
    return total;
}
|
||||
// Multiplies every element of the pack "Is" together; an empty pack yields 1.
CK_TILE_HOST_DEVICE static constexpr auto product()
{
    // binary right fold over "*", seeded with 1 so the empty pack is well-formed
    constexpr auto result = (Is * ... * 1);
    return result;
}
|
||||
|
||||
// modify element at index "I" with value "X"
|
||||
template <index_t I, index_t X>
|
||||
CK_TILE_HOST_DEVICE static constexpr auto modify(number<I>, number<X>)
|
||||
|
||||
Reference in New Issue
Block a user