mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-06-29 11:16:59 +00:00
Use direct sweep_tile in decode pipeline.
Replace the local tile_sweeper wrapper call with a direct sweep_tile(...) call to keep the decode path simpler while preserving behavior.
Made-with: Cursor
This commit is contained in:
@@ -67,8 +67,7 @@ struct TopkSoftmaxDecodePipeline
 w_(idx) = WeightType(1) / (WeightType(1) + exp(-w_(idx)));
 }
 };
-tile_sweeper<decltype(w_), decltype(w_f)> ts{w_, w_f};
-ts();
+sweep_tile(w_, w_f);
 return w_;
 }();
 
Reference in New Issue
Block a user