Files
mscclpp/test/mp_unit/mp_unit_tests.cc
2023-06-25 12:40:12 +08:00

136 lines
4.1 KiB
C++

// Copyright (c) Microsoft Corporation.
// Licensed under the MIT license.
#include "mp_unit_tests.hpp"
#include <mpi.h>
#include <cstring>
#include <sstream>
#include "utils_internal.hpp"
const char gDefaultIpPort[] = "127.0.0.1:50053";
MultiProcessTestEnv* gEnv = nullptr;
int rankToLocalRank(int rank) {
if (gEnv == nullptr) throw std::runtime_error("rankToLocalRank is called before gEnv is initialized");
return rank % gEnv->nRanksPerNode;
}
int rankToNode(int rank) {
if (gEnv == nullptr) throw std::runtime_error("rankToNode is called before gEnv is initialized");
return rank / gEnv->nRanksPerNode;
}
mscclpp::Transport ibIdToTransport(int id) {
mscclpp::Transport IBs[] = {mscclpp::Transport::IB0, mscclpp::Transport::IB1, mscclpp::Transport::IB2,
mscclpp::Transport::IB3, mscclpp::Transport::IB4, mscclpp::Transport::IB5,
mscclpp::Transport::IB6, mscclpp::Transport::IB7};
return IBs[id];
}
MultiProcessTestEnv::MultiProcessTestEnv(int argc, const char** argv) : argc(argc), argv(argv) {}
static std::unordered_map<std::string, std::string> parseArgs(int argc, const char* argv[]) {
auto printUsage = [](const char* prog) {
std::stringstream ss;
ss << "Usage: " << prog << " [-ip_port IP:PORT]\n";
std::cout << ss.str();
};
std::unordered_map<std::string, std::string> options;
// Default values
options["ip_port"] = gDefaultIpPort;
// Parse the command line arguments
for (int i = 1; i < argc; i++) {
std::string arg = argv[i];
if (arg == "-ip_port") {
if (i + 1 < argc) {
options["ip_port"] = argv[++i];
} else {
throw std::invalid_argument("Error: -ip_port option requires an argument.\n");
}
} else if (arg == "-help" || arg == "-h") {
printUsage(argv[0]);
exit(0);
} else {
throw std::invalid_argument("Error: Unknown option " + std::string(argv[i]) + "\n");
}
}
return options;
}
void MultiProcessTestEnv::SetUp() {
MPI_Init(NULL, NULL);
MPI_Comm_rank(MPI_COMM_WORLD, &rank);
MPI_Comm_size(MPI_COMM_WORLD, &worldSize);
// get the local number of nodes with MPI
MPI_Comm shmcomm;
MPI_Comm_split_type(MPI_COMM_WORLD, MPI_COMM_TYPE_SHARED, 0, MPI_INFO_NULL, &shmcomm);
int shmrank;
MPI_Comm_size(shmcomm, &shmrank);
nRanksPerNode = shmrank;
MPI_Comm_free(&shmcomm);
// parse the command line arguments
args = parseArgs(argc, argv);
}
void MultiProcessTestEnv::TearDown() { MPI_Finalize(); }
void MultiProcessTest::TearDown() {
// Wait for all ranks to finish the previous test
MPI_Barrier(MPI_COMM_WORLD);
}
int main(int argc, char** argv) {
::testing::InitGoogleTest(&argc, argv);
gEnv = new MultiProcessTestEnv(argc, (const char**)argv);
::testing::AddGlobalTestEnvironment(gEnv);
return RUN_ALL_TESTS();
}
TEST_F(MultiProcessTest, Prelim) {
// Test to make sure the MPI environment is set up correctly
ASSERT_GE(gEnv->worldSize, 2);
}
TEST_F(MultiProcessTest, HostName) {
const size_t maxNameLen = 1024;
std::vector<char> buffer(gEnv->worldSize * maxNameLen, '\0');
std::string hostName = mscclpp::getHostName(maxNameLen, '\0');
// Copy hostName to buffer
memcpy(buffer.data() + gEnv->rank * maxNameLen, hostName.c_str(), hostName.size());
MPI_Allgather(MPI_IN_PLACE, 0, MPI_BYTE, buffer.data(), maxNameLen, MPI_BYTE, MPI_COMM_WORLD);
for (int rank = 0; rank < gEnv->worldSize; rank++) {
char rankHostName[maxNameLen + 1];
strncpy(rankHostName, buffer.data() + rank * maxNameLen, maxNameLen);
if (rankToNode(rank) == rankToNode(gEnv->rank)) {
ASSERT_EQ(std::string(rankHostName), hostName);
} else {
ASSERT_NE(std::string(rankHostName), hostName);
}
}
}
TEST_F(MultiProcessTest, HostHash) {
std::vector<uint64_t> buffer(gEnv->worldSize, 0);
uint64_t hostHash = mscclpp::getHostHash();
buffer[gEnv->rank] = hostHash;
MPI_Allgather(MPI_IN_PLACE, 0, MPI_BYTE, buffer.data(), sizeof(hostHash), MPI_BYTE, MPI_COMM_WORLD);
for (int rank = 0; rank < gEnv->worldSize; rank++) {
if (rankToNode(rank) == rankToNode(gEnv->rank)) {
ASSERT_EQ(buffer[rank], hostHash);
} else {
ASSERT_NE(buffer[rank], hostHash);
}
}
}