mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-07-03 05:37:34 +00:00
Fix the use of num_targets[] in run_group_hstu_attention
This commit is contained in:
@@ -847,11 +847,23 @@ bool run_group_hstu(const ck_tile::ArgParser& arg_parser, int num_group)
|
||||
|
||||
for(int i_grp = 0; i_grp < num_group; i_grp++)
|
||||
{
|
||||
int max_num_target = 0;
|
||||
|
||||
if(!num_targets.empty())
|
||||
{
|
||||
for(int i_batch = 0; i_batch < num_batch_per_group; i_batch++)
|
||||
{
|
||||
int i_global_batch = i_grp * num_batch_per_group * i_batch;
|
||||
|
||||
max_num_target = max(max_num_target, num_targets[i_global_batch]);
|
||||
};
|
||||
};
|
||||
|
||||
group_max_seqlens_q[i_grp] =
|
||||
group_max_uih_seqlens_q[i_grp] + group_contextual_seqlens[i_grp] + num_targets[i_grp];
|
||||
group_max_uih_seqlens_q[i_grp] + group_contextual_seqlens[i_grp] + max_num_target;
|
||||
max_max_seqlen_q = max(max_max_seqlen_q, group_max_seqlens_q[i_grp]);
|
||||
group_max_seqlens_kv[i_grp] =
|
||||
group_max_uih_seqlens_kv[i_grp] + group_contextual_seqlens[i_grp] + num_targets[i_grp];
|
||||
group_max_uih_seqlens_kv[i_grp] + group_contextual_seqlens[i_grp] + max_num_target;
|
||||
max_max_seqlen_kv = max(max_max_seqlen_kv, group_max_seqlens_kv[i_grp]);
|
||||
};
|
||||
|
||||
|
||||
Reference in New Issue
Block a user