mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 22:39:03 +00:00
Batched gemm softmax gemm descriptor fix (#3564)
* Add rocm to prefix path for codegen
* Fix issue with c0_matrix_mask construction
This commit is contained in:
@@ -1059,7 +1059,7 @@ struct DeviceBatchedGemmSoftmaxGemm_Xdl_CShuffle
|
||||
c_grid_desc_m_n)},
|
||||
has_main_k_block_loop{GridwiseGemm64::CalculateHasMainKBlockLoop(
|
||||
a_grid_desc_ak0_m_ak1.GetLength(I0) * a_grid_desc_ak0_m_ak1.GetLength(I2))},
|
||||
- c0_matrix_mask{c.GetLength(I1)},
|
||||
+ c0_matrix_mask{b.GetLength(I0)},
|
||||
a_element_op{a_element_op_},
|
||||
b_element_op{b_element_op_},
|
||||
b1_element_op{b1_element_op_},
|
||||
|
||||
Reference in New Issue
Block a user