mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-13 09:45:56 +00:00
Add splitk gemm fp16 @ fp16 with fp8 compute instances (#983)
* Add ComputeType
* Update for compatibility
* Add instances
* Update profiler API
This commit is contained in:
@@ -30,7 +30,8 @@ template <typename ADataType,
|
||||
typename CDataType,
|
||||
typename ALayout,
|
||||
typename BLayout,
|
||||
typename CLayout>
|
||||
typename CLayout,
|
||||
typename ComputeType = CDataType>
|
||||
bool profile_gemm_splitk_impl(int do_verification,
|
||||
int init_method,
|
||||
bool do_log,
|
||||
@@ -103,7 +104,8 @@ bool profile_gemm_splitk_impl(int do_verification,
|
||||
CDataType,
|
||||
AElementOp,
|
||||
BElementOp,
|
||||
CElementOp>;
|
||||
CElementOp,
|
||||
ComputeType>;
|
||||
|
||||
// get device op instances
|
||||
const auto op_ptrs = ck::tensor_operation::device::instance::DeviceOperationInstanceFactory<
|
||||
@@ -120,7 +122,8 @@ bool profile_gemm_splitk_impl(int do_verification,
|
||||
AccDataType,
|
||||
AElementOp,
|
||||
BElementOp,
|
||||
CElementOp>;
|
||||
CElementOp,
|
||||
ComputeType>;
|
||||
|
||||
auto ref_gemm = ReferenceGemmInstance{};
|
||||
auto ref_invoker = ref_gemm.MakeInvoker();
|
||||
|
||||
Reference in New Issue
Block a user