[rocm-libraries] ROCm/rocm-libraries#4872 (commit ca623f7)

[CK] Small improvements for grouped conv backward weight
 (#4872)

## Motivation

Improvements for CK Tile convolution builder run function and atol/rtol
calculations.

## Technical Details

- Add a preprocessing function for wrw when k_batch is larger than 1 for
the builder run function
- Divide num_accums by the number of groups to get the real number of accumulations

## Test Plan

CI wrw tests

## Test Result

pending

## Submission Checklist

- [x] Look over the contributing guidelines at
https://github.com/ROCm/ROCm/blob/develop/CONTRIBUTING.md#pull-requests.

AICK-783
This commit is contained in:
Bartłomiej Kocot
2026-02-25 20:11:01 +00:00
committed by assistant-librarian[bot]
parent c90a363589
commit eede24de0d
5 changed files with 28 additions and 7 deletions

View File

@@ -244,7 +244,8 @@ class TestGroupedConvndBwdWeight : public ::testing::Test
float max_accumulated_value =
*std::max_element(wei_host.mData.begin(), wei_host.mData.end());
const ck::index_t num_accums = out.GetElementSize() / conv_param.K_;
const ck::index_t num_accums =
out.GetElementSize() / (conv_param.K_ * conv_param.G_);
const ck::index_t num_accums_split_k = split_k;
double rtol =
ck::utils::get_relative_threshold<InDataType, WeiDataType, AccDataType>(

View File

@@ -199,7 +199,8 @@ class TestGroupedConvndBwdWeight : public ::testing::Test
float max_accumulated_value =
*std::max_element(wei_host.mData.begin(), wei_host.mData.end());
const ck::index_t num_accums = out.GetElementSize() / conv_param.K_;
const ck::index_t num_accums =
out.GetElementSize() / (conv_param.K_ * conv_param.G_);
const ck::index_t num_accums_split_k = split_k;
double rtol =
ck::utils::get_relative_threshold<InDataType, WeiDataType, AccDataType>(