Files
mscclpp/test/unit/fifo_tests.cu
Saeed Maleki 8d1b984bed Change device handle interfaces & others (#142)
* Changed device handle interfaces
* Changed proxy service interfaces
* Move device code into separate files
* Fixed FIFO polling issues
* Add configuration arguments in several interface functions

---------

Co-authored-by: Changho Hwang <changhohwang@microsoft.com>
Co-authored-by: Binyang Li <binyli@microsoft.com>
Co-authored-by: root <root@a100-saemal0.qxveptpukjsuthqvv514inp03c.gx.internal.cloudapp.net>
2023-08-16 20:00:56 +08:00

80 lines
2.1 KiB
Plaintext

// Copyright (c) Microsoft Corporation.
// Licensed under the MIT license.
#include <gtest/gtest.h>
#include <mscclpp/cuda_utils.hpp>
#include <mscclpp/fifo.hpp>
#include <mscclpp/numa.hpp>
#include <mscclpp/utils.hpp>
#define ITER 10000 // should be larger than the FIFO size for proper testing
__constant__ mscclpp::FifoDeviceHandle gFifoTestFifoDeviceHandle;
__global__ void kernelFifoTest() {
if (threadIdx.x + blockIdx.x * blockDim.x != 0) return;
mscclpp::FifoDeviceHandle& fifo = gFifoTestFifoDeviceHandle;
mscclpp::ProxyTrigger trigger;
for (uint64_t i = 1; i < ITER + 1; ++i) {
trigger.fst = i;
trigger.snd = i;
uint64_t curFifoHead = fifo.push(trigger);
if (i % fifo.size == 0) {
fifo.sync(curFifoHead);
}
}
}
TEST(FifoTest, Fifo) {
int cudaNum;
MSCCLPP_CUDATHROW(cudaGetDevice(&cudaNum));
int numaNode = mscclpp::getDeviceNumaNode(cudaNum);
mscclpp::numaBind(numaNode);
mscclpp::Fifo hostFifo;
if (hostFifo.size() >= ITER) {
FAIL() << "ITER is too small for proper testing.";
}
mscclpp::FifoDeviceHandle devFifo = hostFifo.deviceHandle();
MSCCLPP_CUDATHROW(cudaMemcpyToSymbol(gFifoTestFifoDeviceHandle, &devFifo, sizeof(devFifo)));
kernelFifoTest<<<1, 1>>>();
MSCCLPP_CUDATHROW(cudaGetLastError());
mscclpp::ProxyTrigger trigger;
trigger.fst = 0;
trigger.snd = 0;
uint64_t spin = 0;
uint64_t flushCnt = 0;
mscclpp::Timer timer(3);
for (uint64_t i = 0; i < ITER; ++i) {
while (trigger.fst == 0 || trigger.snd == 0) {
trigger = hostFifo.poll();
if (spin++ > 1000000) {
FAIL() << "Polling is stuck.";
}
}
// see `src/proxy.cc` for the reason of this line
trigger.snd ^= ((uint64_t)1 << (uint64_t)63);
ASSERT_TRUE(trigger.fst == (i + 1));
ASSERT_TRUE(trigger.snd == (i + 1));
hostFifo.pop();
if ((++flushCnt % hostFifo.size()) == 0) {
hostFifo.flushTail();
}
trigger.fst = 0;
spin = 0;
}
hostFifo.flushTail(true);
std::stringstream ss;
ss << "FifoTest.Fifo: " << (float)timer.elapsed() / ITER << " us/iter\n";
std::cout << ss.str();
MSCCLPP_CUDATHROW(cudaDeviceSynchronize());
}