mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-05 06:01:23 +00:00
add fp8 as dst (#1830)
This commit is contained in:
@@ -113,7 +113,7 @@ struct SmoothquantPipelineOnePass
|
||||
sweep_tile(qy, [&](auto idx) {
|
||||
constexpr auto i_idx = make_tuple(idx[number<0>{}]);
|
||||
auto qy_ = y[idx] / yscale[i_idx];
|
||||
- qy(idx) = saturates<QYDataType>{}(qy_);
|
||||
+ qy(idx) = type_convert<QYDataType>(saturates<QYDataType>{}(qy_));
|
||||
});
|
||||
store_tile(qy_window, qy);
|
||||
}
|
||||
|
||||
@@ -136,7 +136,7 @@ struct SmoothquantPipelineTwoPass
|
||||
sweep_tile(qy, [&](auto idx) {
|
||||
constexpr auto i_idx = make_tuple(idx[number<0>{}]);
|
||||
auto qy_ = y[idx] / yscale[i_idx];
|
||||
- qy(idx) = saturates<QYDataType>{}(qy_);
|
||||
+ qy(idx) = type_convert<QYDataType>(saturates<QYDataType>{}(qy_));
|
||||
});
|
||||
store_tile(qy_window, qy);
|
||||
|
||||
|
||||
Reference in New Issue
Block a user