mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-24 14:54:47 +00:00
[CK_TILE] Add permuteN optimization to remove lds operation in c_shuffle (#2764)
* permuteN optimization to remove lds operation in c_shuffle
* add the change log
---------
Co-authored-by: ThomasNing <thomas.ning@amd.com>
[ROCm/composable_kernel commit: 75570d0fa8]
This commit is contained in:
@@ -175,6 +175,9 @@ struct sequence
|
||||
return sequence<type::get(number<Ids>{})...>{};
|
||||
}
|
||||
|
||||
// Adds up every value in the parameter pack `Is`.
// Yields 0 when the pack is empty.
CK_TILE_HOST_DEVICE static constexpr auto sum()
{
    // Binary right fold over `+`; the trailing 0 is the seed value that
    // also serves as the result for an empty pack.
    const auto total = (Is + ... + 0);
    return total;
}
|
||||
// Multiplies together every value in the parameter pack `Is`.
// Yields 1 when the pack is empty.
CK_TILE_HOST_DEVICE static constexpr auto product()
{
    // Binary right fold over `*`; the trailing 1 is the seed value that
    // also serves as the result for an empty pack.
    const auto total = (Is * ... * 1);
    return total;
}
|
||||
|
||||
// modify element at index "I" with value "X"
|
||||
template <index_t I, index_t X>
|
||||
CK_TILE_HOST_DEVICE static constexpr auto modify(number<I>, number<X>)
|
||||
|
||||
Reference in New Issue
Block a user