mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-14 18:17:44 +00:00
Add bias scalar vectorload = 1 for gemm bias gemm (#791)
* first change bias load
* add bias dim and scalar-per-vector parameter
* make CDE0BlockTransferSrcVectorDim not work
* changes to instance
* add limit for CDE0BlockTransferSrcScalarPerVector
[ROCm/composable_kernel commit: 50643dd555]
This commit is contained in:
@@ -173,6 +173,8 @@ using DeviceGemmInstance =
|
||||
8,
|
||||
8,
|
||||
true,
|
||||
9, // D0sTransferSrcVectorDim
|
||||
4, // D0sTransferSrcScalarPerVector
|
||||
S<8, 32, 1>, // B1BlockTransfer
|
||||
S<0, 2, 1>,
|
||||
S<0, 2, 1>,
|
||||
@@ -189,7 +191,7 @@ int main(int argc, char* argv[])
|
||||
{
|
||||
bool do_verification = true;
|
||||
int init_method = 1;
|
||||
bool time_kernel = false;
|
||||
bool time_kernel = true;
|
||||
|
||||
// GEMM shape
|
||||
ck::index_t M = 1024;
|
||||
|
||||
Reference in New Issue
Block a user