Fix some compile errors

This commit is contained in:
joye
2025-05-15 14:36:02 +08:00
parent 726ae62113
commit 2fdcb55cf1
3 changed files with 8 additions and 9 deletions

View File

@@ -77,6 +77,9 @@ struct buffer_store;
template <index_t bytes>
struct buffer_store_if;
template <index_t bytes, bool pre_nop = false>
struct async_buffer_load;
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wundefined-reinterpret-cast"
// TODO: the strict-aliasing rule seems to fail when using reinterpret_cast between vector types

View File

@@ -92,18 +92,14 @@ CK_TILE_DEVICE auto load_tile_raw(T& tile,
template <typename LdsTileWindow_,
typename TileWindow_,
index_t i_access = -1,
bool oob_conditional_check = true,
bool pre_nop = false>
bool oob_conditional_check = true>
CK_TILE_DEVICE auto async_load_tile(LdsTileWindow_&& lds_tile,
const TileWindow_& tile_window,
number<i_access> = {},
bool_constant<oob_conditional_check> = {},
bool_constant<pre_nop> = {})
bool_constant<oob_conditional_check> = {})
{
return tile_window.async_load(lds_tile,
number<i_access>{},
bool_constant<oob_conditional_check>{},
bool_constant<pre_nop>{});
return tile_window.async_load(
lds_tile, number<i_access>{}, bool_constant<oob_conditional_check>{});
}
template <typename LdsTileWindow_,

View File

@@ -748,7 +748,7 @@ struct tile_window_linear
auto bottom_tensor_flag = cached_flags_[IAccess];
auto lds_bottom_tensor_thread_idx =
lds_tile.get_window_origin() + window_adaptor_thread_coord.get_bottom_index();
lds_tile.get_window_origin() + window_adaptor_coord.get_bottom_index();
const auto lds_coord =
make_tensor_coordinate(lds_tile.get_bottom_tensor_view().get_tensor_descriptor(),