mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-16 19:09:59 +00:00
Add an int8 direct convolution that reads pre-vectorized data
[ROCm/composable_kernel commit: 050a1a6890]
This commit is contained in:
@@ -51,10 +51,8 @@ __device__ void threadwise_direct_convolution_1(InDesc,
|
||||
|
||||
const unsigned out_index = out_desc.Get1dIndex(n, k, ho, wo);
|
||||
|
||||
fused_multiply_add(p_out[out_index],
|
||||
p_wei[wei_index],
|
||||
p_in[in_index],
|
||||
p_out[out_index]);
|
||||
fused_multiply_accumulate(
|
||||
p_out[out_index], p_wei[wei_index], p_in[in_index]);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user