both allgather algorithms

This commit is contained in:
Saeed Maleki
2023-03-19 06:35:40 +00:00
parent 17cbc84a14
commit 3e8f6758e5

View File

@@ -180,7 +180,7 @@ int main(int argc, const char *argv[])
int *data_d;
uint64_t *flag_d;
-size_t data_size = 1024*1024*1024;
+size_t data_size = 1024*1024;
int nelemsPerGPU = data_size / sizeof(int) / world_size;
CUDACHECK(cudaMalloc(&data_d, data_size));
CUDACHECK(cudaMalloc(&flag_d, sizeof(uint64_t)));