mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-06-29 19:28:33 +00:00
Add buffer_load_lds synchronization
This commit is contained in:
@@ -679,6 +679,7 @@ struct F16xMXF4FlatmmPipelineAGmemBGmemCRegV1
|
||||
async_load_tile(lds_tile_a, dram_tile_a);
|
||||
};
|
||||
auto prefill_lds_a_stage2 = [&](auto lds_tile_a) {
|
||||
async_load_fence();
|
||||
// Data has already been stored in LDS; no further operation is needed.
|
||||
static_assert(std::is_same_v<AElementFunction, identity>,
|
||||
"buffer_load_lds don't support element func fot A before mfma");
|
||||
|
||||
Reference in New Issue
Block a user