mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-04 05:31:24 +00:00
enable compilation of INSTANCES_ONLY for Windows (#1082)
* enable compilation of INSTANCES_ONLY for Windows
* suppress ROCMChecks warnings on GoogleTests
* suppress -Wfloat-equal warning on GoogleTests

---------

Co-authored-by: Illia Silin <98187287+illsilin@users.noreply.github.com>
This commit is contained in:
@@ -174,6 +174,11 @@ struct PassThrough
|
||||
{
|
||||
y = x;
|
||||
}
|
||||
template <>
|
||||
__host__ __device__ void operator()<int4_t, int>(int4_t& y, const int& x) const
|
||||
{
|
||||
y = type_convert<int4_t>(x);
|
||||
}
|
||||
#endif
|
||||
|
||||
template <>
|
||||
|
||||
@@ -119,7 +119,7 @@ struct GridwiseElementwiseLayernormWelfordVariance_mk_to_mk
|
||||
index_t num_k_block_tile_iteration,
|
||||
AccDataType epsilon,
|
||||
const InDataTypePointerTuple p_in_global_tuple,
|
||||
XDataType* const __restrict__ p_x_lds,
|
||||
XDataType* const __restrict__ p_x_lds_,
|
||||
const GammaDataType* const __restrict__ p_gamma_global,
|
||||
const BetaDataType* const __restrict__ p_beta_global,
|
||||
YDataType* const __restrict__ p_y_global,
|
||||
@@ -149,7 +149,7 @@ struct GridwiseElementwiseLayernormWelfordVariance_mk_to_mk
|
||||
p_y_global, y_grid_desc_m_k.GetElementSpaceSize());
|
||||
|
||||
auto x_lds_val_buf = make_dynamic_buffer<AddressSpaceEnum::Lds>(
|
||||
p_x_lds, x_grid_desc_m_k.GetElementSpaceSize() / grid_size);
|
||||
p_x_lds_, x_grid_desc_m_k.GetElementSpaceSize() / grid_size);
|
||||
|
||||
auto in_thread_buf_tuple = generate_tuple(
|
||||
[&](auto) {
|
||||
|
||||
@@ -328,7 +328,7 @@ struct WmmaSelector
|
||||
}
|
||||
#ifdef CK_EXPERIMENTAL_BIT_INT_EXTENSION_INT4
|
||||
template <>
|
||||
static constexpr auto GetWmma<int4_t, int, 16, 16>()
|
||||
static constexpr auto GetWmma<int4_t, int4_t, int, 16, 16>()
|
||||
{
|
||||
return WmmaInstr::wmma_i32_16x16x16_iu4;
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user