Add int8 direct convolution that reads pre-vectorized data

[ROCm/composable_kernel commit: 050a1a6890]
This commit is contained in:
Chao Liu
2019-03-19 00:05:41 -05:00
parent 14ad082d6c
commit 80f2ab2e09
6 changed files with 247 additions and 95 deletions

View File

@@ -51,10 +51,8 @@ __device__ void threadwise_direct_convolution_1(InDesc,
const unsigned out_index = out_desc.Get1dIndex(n, k, ho, wo);
-fused_multiply_add(p_out[out_index],
-p_wei[wei_index],
-p_in[in_index],
-p_out[out_index]);
+fused_multiply_accumulate(
+p_out[out_index], p_wei[wei_index], p_in[in_index]);
}
}
}