diff --git a/include/ck_tile/core/arch/amd_buffer_addressing.hpp b/include/ck_tile/core/arch/amd_buffer_addressing.hpp index 50f81ecf84..69443abd1c 100644 --- a/include/ck_tile/core/arch/amd_buffer_addressing.hpp +++ b/include/ck_tile/core/arch/amd_buffer_addressing.hpp @@ -77,6 +77,9 @@ struct buffer_store; template struct buffer_store_if; +template +struct async_buffer_load; + #pragma clang diagnostic push #pragma clang diagnostic ignored "-Wundefined-reinterpret-cast" // TODO: strict aliasing rule seems fail when reinterpret_cast between vector type diff --git a/include/ck_tile/core/tensor/load_tile.hpp b/include/ck_tile/core/tensor/load_tile.hpp index 7168551abf..8b7541bf23 100644 --- a/include/ck_tile/core/tensor/load_tile.hpp +++ b/include/ck_tile/core/tensor/load_tile.hpp @@ -92,18 +92,14 @@ CK_TILE_DEVICE auto load_tile_raw(T& tile, template + bool oob_conditional_check = true> CK_TILE_DEVICE auto async_load_tile(LdsTileWindow_&& lds_tile, const TileWindow_& tile_window, number = {}, - bool_constant = {}, - bool_constant = {}) + bool_constant = {}) { - return tile_window.async_load(lds_tile, - number{}, - bool_constant{}, - bool_constant{}); + return tile_window.async_load( + lds_tile, number{}, bool_constant{}); } template