Allow binding allocated memory to NVLS multicast pointer (#290)

Also change the NVLS multimem instructions to static functions.
This commit is contained in:
Roshan Dathathri
2024-04-18 17:11:31 -07:00
committed by GitHub
parent 64d837f9ab
commit 41e0964d93
5 changed files with 26 additions and 19 deletions

View File

@@ -41,8 +41,8 @@ extern "C" __global__ void __launch_bounds__(1024, 1)
for (int idx = my_st + my_offset; idx < my_en; idx += my_step) {
uint4 val;
-nvlsPtrs.multimemLoad(val, mc_ptr + idx);
-nvlsPtrs.multimemStore(val, mc_ptr + idx);
+DeviceMulticastPointerDeviceHandle::multimemLoad(val, mc_ptr + idx);
+DeviceMulticastPointerDeviceHandle::multimemStore(val, mc_ptr + idx);
}
deviceSyncer.sync(gridDim.x);