Add grouped convnd dataset tests for bwd_data, bwd_weight and make them parallel (#3380)

* Parallelization in dataset generation

* Parallelizable tests for fwd, bwd data, bwd weight with datasets

* .gitignore generated datasets

* Test parallelization script with round-robin GPU scheduling

* Parallelization updates to test generation and running

* Dataset paths relative to executable

* Update output from test generation

* Default to one GPU in test generation

* Add small dataset tests to Jenkins

* Update copyright lines

* Update test_data/generate_test_dataset.sh

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>

* Move trap disable

* Common get path function

---------

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>

[ROCm/composable_kernel commit: fe35ba5dac]
This commit is contained in:
Johannes Graner
2025-12-15 13:38:25 +01:00
committed by GitHub
parent a45c051ac9
commit 2fe4c8acec
10 changed files with 2349 additions and 331 deletions

View File

@@ -0,0 +1,246 @@
// Copyright (c) Advanced Micro Devices, Inc., or its affiliates.
// SPDX-License-Identifier: MIT
#pragma once
#include <fstream>
#include <filesystem>
#include <iostream>
#include <sstream>
#include <string>
#include <vector>
#include "ck/library/utility/convolution_parameter.hpp"
namespace ck {
namespace test {
namespace fs = std::filesystem;
// Helper function to find test_data directory relative to the test binary
static std::string GetTestDataPath()
{
// Get the path to the current executable
fs::path exe_path = fs::read_symlink("/proc/self/exe");
// Get the directory containing the executable
fs::path current_dir = exe_path.parent_path();
// Search for test_data directory by going up the directory tree
// This makes the code robust regardless of build directory depth
while(current_dir != current_dir.root_path())
{
fs::path test_data_path = current_dir / "test_data";
if(fs::exists(test_data_path) && fs::is_directory(test_data_path))
{
return test_data_path.string();
}
current_dir = current_dir.parent_path();
}
// If not found, return empty string
std::cerr << "ERROR: Could not find test_data directory relative to executable" << std::endl;
return "";
}
// CSV Reader Function for Loading Test Cases
// Reads convolution parameters from CSV file and returns vector of ConvParam structures
inline std::vector<ck::utils::conv::ConvParam> load_csv_test_cases(const std::string& filename)
{
std::vector<ck::utils::conv::ConvParam> conv_params; // Return vector
std::ifstream file(filename); // Open CSV file
if(!file.is_open())
{
std::cerr << "ERROR: Cannot open CSV file: " << filename << std::endl;
return conv_params; // Return empty vector on error
}
std::string line;
int line_number = 0;
// Read file line by line
while(std::getline(file, line))
{
line_number++;
// Skip comment lines (starting with #) and empty lines
if(line.empty() || line[0] == '#')
{
continue;
}
// Skip header line (contains column names)
if(line.find("NDim,Groups,BatchSize") != std::string::npos)
{
continue;
}
// Parse CSV line using stringstream
std::stringstream ss(line);
std::string cell;
std::vector<std::string> row;
// Split line by commas
while(std::getline(ss, cell, ','))
{
row.push_back(cell);
}
// Validate row has correct number of columns
if(row.size() < 19)
{ // Need at least 19 columns for 2D (excluding TestName)
std::cerr << "WARNING: Line " << line_number << " has insufficient columns ("
<< row.size() << "), skipping" << std::endl;
continue;
}
try
{
// Parse CSV data into ConvParam structure
// CSV Format:
// NDim,Groups,BatchSize,OutChannels,InChannels,KernelH,KernelW,InputH,InputW,OutputH,OutputW,StrideH,StrideW,DilationH,DilationW,LeftPadH,LeftPadW,RightPadH,RightPadW,TestName
int NDim = std::stoi(row[0]);
int Groups = std::stoi(row[1]);
int BatchSize = std::stoi(row[2]);
int OutChannels = std::stoi(row[3]);
int InChannels = std::stoi(row[4]);
if(NDim == 1)
{
// 1D Convolution: Need fewer columns for 1D parameters
if(row.size() < 13)
{
std::cerr << "WARNING: 1D convolution on line " << line_number
<< " needs 13+ columns, has " << row.size() << ", skipping"
<< std::endl;
continue;
}
// 1D Convolution: {NDim, Groups, BatchSize, OutChannels, InChannels,
// {KernelW}, {InputW}, {StrideW}, {DilationW}, {LeftPadW}, {RightPadW}}
ck::utils::conv::ConvParam param = {
NDim, // NDim = 1
Groups, // Groups
BatchSize, // Batch size
OutChannels, // Output channels
InChannels, // Input channels
{std::stoi(row[5])}, // Kernel: {W}
{std::stoi(row[7])}, // Input: {W}
{std::stoi(row[11])}, // Stride: {W}
{std::stoi(row[13])}, // Dilation: {W}
{std::stoi(row[15])}, // Left pad: {W}
{std::stoi(row[17])} // Right pad: {W}
};
conv_params.push_back(param);
}
else if(NDim == 2)
{
// 2D Convolution: {NDim, Groups, BatchSize, OutChannels, InChannels,
// {KernelH,KernelW}, {InputH,InputW}, {StrideH,StrideW}, {DilationH,DilationW},
// {LeftPadH,LeftPadW}, {RightPadH,RightPadW}}
ck::utils::conv::ConvParam param = {
NDim, // NDim = 2
Groups, // Groups
BatchSize, // Batch size
OutChannels, // Output channels
InChannels, // Input channels
{std::stoi(row[5]), std::stoi(row[6])}, // Kernel: {H, W}
{std::stoi(row[7]), std::stoi(row[8])}, // Input: {H, W}
{std::stoi(row[11]), std::stoi(row[12])}, // Stride: {H, W}
{std::stoi(row[13]), std::stoi(row[14])}, // Dilation: {H, W}
{std::stoi(row[15]), std::stoi(row[16])}, // Left pad: {H, W}
{std::stoi(row[17]), std::stoi(row[18])} // Right pad: {H, W}
};
conv_params.push_back(param);
}
else if(NDim == 3)
{
// 3D Convolution: Need more columns for 3D parameters
if(row.size() < 26)
{
std::cerr << "WARNING: 3D convolution on line " << line_number
<< " needs 26+ columns, has " << row.size() << ", skipping"
<< std::endl;
continue;
}
// 3D Convolution: {NDim, Groups, BatchSize, OutChannels, InChannels,
// {KernelD,KernelH,KernelW}, {InputD,InputH,InputW}, {OutputD,OutputH,OutputW},
// {StrideD,StrideH,StrideW}, {DilationD,DilationH,DilationW},
// {LeftPadD,LeftPadH,LeftPadW}, {RightPadD,RightPadH,RightPadW}}
ck::utils::conv::ConvParam param = {
NDim, // NDim = 3
Groups, // Groups
BatchSize, // Batch size
OutChannels, // Output channels
InChannels, // Input channels
{std::stoi(row[5]), std::stoi(row[6]), std::stoi(row[7])}, // Kernel: {D, H, W}
{std::stoi(row[8]), std::stoi(row[9]), std::stoi(row[10])}, // Input: {D, H, W}
{std::stoi(row[14]),
std::stoi(row[15]),
std::stoi(row[16])}, // Stride: {D, H, W}
{std::stoi(row[17]),
std::stoi(row[18]),
std::stoi(row[19])}, // Dilation: {D, H, W}
{std::stoi(row[20]),
std::stoi(row[21]),
std::stoi(row[22])}, // Left pad: {D, H, W}
{std::stoi(row[23]),
std::stoi(row[24]),
std::stoi(row[25])} // Right pad: {D, H, W}
};
conv_params.push_back(param);
}
else
{
std::cerr << "WARNING: Unsupported NDim=" << NDim << " on line " << line_number
<< ", skipping" << std::endl;
}
}
catch(const std::exception& e)
{
std::cerr << "ERROR: Failed to parse line " << line_number << ": " << e.what()
<< std::endl;
continue;
}
}
file.close();
std::cout << "Loaded " << conv_params.size() << " test cases from " << filename << std::endl;
return conv_params;
}
// Helper function to load CSV test cases and populate conv_params vector
// Returns true if loading succeeded, false otherwise
inline bool load_and_populate_test_cases(const std::vector<std::string>& csv_paths,
std::vector<ck::utils::conv::ConvParam>& conv_params,
const std::string& dimension_label)
{
for(const auto& csv_path : csv_paths)
{
auto csv_cases = load_csv_test_cases(csv_path);
if(!csv_cases.empty())
{
// Successfully loaded CSV data - add all test cases to conv_params
for(const auto& test_case : csv_cases)
{
conv_params.push_back(test_case);
}
std::cout << "Loaded " << csv_cases.size() << " " << dimension_label
<< " test cases from " << csv_path << std::endl;
return true;
}
}
// Failed to load from any path
std::cerr << "ERROR: Failed to load CSV test data from any of these locations:" << std::endl;
for(const auto& path : csv_paths)
{
std::cerr << " - " << path << std::endl;
}
std::cerr << "\nPlease ensure CSV test data exists in one of these locations." << std::endl;
std::cerr << "Run generate_test_dataset.sh in test_data/ to create test datasets." << std::endl;
return false;
}
} // namespace test
} // namespace ck

View File

@@ -9,6 +9,10 @@ if(GPU_TARGETS MATCHES "gfx9|gfx11|gfx12")
add_executable(test_grouped_convnd_bwd_data_xdl_large_cases test_grouped_convnd_bwd_data_xdl_large_cases.cpp)
target_compile_options(test_grouped_convnd_bwd_data_xdl_large_cases PRIVATE -Wno-global-constructors -Wno-undef)
target_link_libraries(test_grouped_convnd_bwd_data_xdl_large_cases PRIVATE gtest_main getopt::getopt utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance)
add_executable(test_grouped_convnd_bwd_data_dataset_xdl test_grouped_convnd_bwd_data_dataset_xdl.cpp)
target_compile_options(test_grouped_convnd_bwd_data_dataset_xdl PRIVATE -Wno-global-constructors -Wno-undef)
target_link_libraries(test_grouped_convnd_bwd_data_dataset_xdl PRIVATE gtest_main getopt::getopt utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance)
endif()
add_gtest_executable(test_grouped_convnd_bwd_data_wmma test_grouped_convnd_bwd_data_wmma.cpp)
if(result EQUAL 0)

View File

@@ -0,0 +1,317 @@
// Copyright (c) Advanced Micro Devices, Inc., or its affiliates.
// SPDX-License-Identifier: MIT
#include <cstdlib> // Standard C library (exit codes, malloc)
#include <iostream> // C++ I/O streams (cout, cerr)
#include <initializer_list> // C++ initializer list support (unused here)
#include <vector> // C++ vector container - stores test cases
#include <string> // String operations
#include <gtest/gtest.h> // Google Test framework - provides TEST_P, INSTANTIATE_TEST_SUITE_P
#include "profiler/profile_grouped_conv_bwd_data_impl.hpp" // The actual GPU profiler that does convolution work
#include "../common/csv_test_loader.hpp" // Shared CSV test case loader
using namespace ck::tensor_layout::convolution; // Import tensor layout names (GNHWK, GKYXC, etc.)
// Load CSV data for 2D tests
static std::vector<ck::utils::conv::ConvParam> Get2DTestCases()
{
static std::vector<ck::utils::conv::ConvParam> test_cases;
if(test_cases.empty())
{
std::string test_data_dir = ck::test::GetTestDataPath();
if(test_data_dir.empty())
{
std::cerr << "FATAL: test_data directory not found" << std::endl;
return test_cases;
}
std::vector<std::string> csv_paths = {test_data_dir + "/conv_test_set_2d_dataset.csv"};
bool loaded = ck::test::load_and_populate_test_cases(csv_paths, test_cases, "2D");
if(!loaded)
{
std::cerr << "FATAL: Failed to load 2D test cases from " << csv_paths[0] << std::endl;
}
}
return test_cases;
}
// Load CSV data for 3D tests
static std::vector<ck::utils::conv::ConvParam> Get3DTestCases()
{
static std::vector<ck::utils::conv::ConvParam> test_cases;
if(test_cases.empty())
{
std::string test_data_dir = ck::test::GetTestDataPath();
if(test_data_dir.empty())
{
std::cerr << "FATAL: test_data directory not found" << std::endl;
return test_cases;
}
std::vector<std::string> csv_paths = {test_data_dir + "/conv_test_set_3d_dataset.csv"};
bool loaded = ck::test::load_and_populate_test_cases(csv_paths, test_cases, "3D");
if(!loaded)
{
std::cerr << "FATAL: Failed to load 3D test cases from " << csv_paths[0] << std::endl;
}
}
return test_cases;
}
// Helper template to run a single backward data convolution test with split_k
template <ck::index_t NDimSpatial,
typename OutLayout,
typename WeiLayout,
typename InLayout,
typename DataType>
bool RunConvBwdDataTest(const ck::utils::conv::ConvParam& param, ck::index_t split_k)
{
return ck::profiler::profile_grouped_conv_bwd_data_impl<NDimSpatial,
OutLayout,
WeiLayout,
InLayout,
DataType,
DataType,
DataType>(true, // do_verification
1, // init_method
false, // do_log
false, // time_kernel
param, // ConvParam
split_k, // Split-K value
-1); // instance_index
}
// 2D Tests - GNHWK layout - Float - SplitK=1
class TestGroupedConvndBwdData2dGNHWKFloatSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dGNHWKFloatSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, GNHWK, GKYXC, GNHWC, float>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dGNHWKFloatSplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - GNHWK layout - Float - SplitK=2
class TestGroupedConvndBwdData2dGNHWKFloatSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dGNHWKFloatSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, GNHWK, GKYXC, GNHWC, float>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dGNHWKFloatSplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - GNHWK layout - Half - SplitK=1
class TestGroupedConvndBwdData2dGNHWKHalfSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dGNHWKHalfSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, GNHWK, GKYXC, GNHWC, ck::half_t>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dGNHWKHalfSplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - GNHWK layout - Half - SplitK=2
class TestGroupedConvndBwdData2dGNHWKHalfSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dGNHWKHalfSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, GNHWK, GKYXC, GNHWC, ck::half_t>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dGNHWKHalfSplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - GNHWK layout - BFloat16 - SplitK=1
class TestGroupedConvndBwdData2dGNHWKBFloat16SplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dGNHWKBFloat16SplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, GNHWK, GKYXC, GNHWC, ck::bhalf_t>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dGNHWKBFloat16SplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - GNHWK layout - BFloat16 - SplitK=2
class TestGroupedConvndBwdData2dGNHWKBFloat16SplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dGNHWKBFloat16SplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, GNHWK, GKYXC, GNHWC, ck::bhalf_t>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dGNHWKBFloat16SplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - Float - SplitK=1
class TestGroupedConvndBwdData2dNHWGKFloatSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dNHWGKFloatSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, NHWGK, GKYXC, NHWGC, float>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dNHWGKFloatSplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - Float - SplitK=2
class TestGroupedConvndBwdData2dNHWGKFloatSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dNHWGKFloatSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, NHWGK, GKYXC, NHWGC, float>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dNHWGKFloatSplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - Half - SplitK=1
class TestGroupedConvndBwdData2dNHWGKHalfSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dNHWGKHalfSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, NHWGK, GKYXC, NHWGC, ck::half_t>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dNHWGKHalfSplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - Half - SplitK=2
class TestGroupedConvndBwdData2dNHWGKHalfSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dNHWGKHalfSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, NHWGK, GKYXC, NHWGC, ck::half_t>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dNHWGKHalfSplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - BFloat16 - SplitK=1
class TestGroupedConvndBwdData2dNHWGKBFloat16SplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dNHWGKBFloat16SplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, NHWGK, GKYXC, NHWGC, ck::bhalf_t>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dNHWGKBFloat16SplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - BFloat16 - SplitK=2
class TestGroupedConvndBwdData2dNHWGKBFloat16SplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData2dNHWGKBFloat16SplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<2, NHWGK, GKYXC, NHWGC, ck::bhalf_t>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData2dNHWGKBFloat16SplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 3D Tests - NDHWGK layout - Float - SplitK=1
class TestGroupedConvndBwdData3dNDHWGKFloatSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData3dNDHWGKFloatSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<3, NDHWGK, GKZYXC, NDHWGC, float>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData3dNDHWGKFloatSplitK1,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - Float - SplitK=2
class TestGroupedConvndBwdData3dNDHWGKFloatSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData3dNDHWGKFloatSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<3, NDHWGK, GKZYXC, NDHWGC, float>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData3dNDHWGKFloatSplitK2,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - Half - SplitK=1
class TestGroupedConvndBwdData3dNDHWGKHalfSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData3dNDHWGKHalfSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<3, NDHWGK, GKZYXC, NDHWGC, ck::half_t>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData3dNDHWGKHalfSplitK1,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - Half - SplitK=2
class TestGroupedConvndBwdData3dNDHWGKHalfSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData3dNDHWGKHalfSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<3, NDHWGK, GKZYXC, NDHWGC, ck::half_t>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData3dNDHWGKHalfSplitK2,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - BFloat16 - SplitK=1
class TestGroupedConvndBwdData3dNDHWGKBFloat16SplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData3dNDHWGKBFloat16SplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<3, NDHWGK, GKZYXC, NDHWGC, ck::bhalf_t>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData3dNDHWGKBFloat16SplitK1,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - BFloat16 - SplitK=2
class TestGroupedConvndBwdData3dNDHWGKBFloat16SplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdData3dNDHWGKBFloat16SplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdDataTest<3, NDHWGK, GKZYXC, NDHWGC, ck::bhalf_t>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdData3dNDHWGKBFloat16SplitK2,
::testing::ValuesIn(Get3DTestCases()));

View File

@@ -4,6 +4,10 @@
if(GPU_TARGETS MATCHES "gfx9|gfx11|gfx12")
add_gtest_executable(test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight.cpp)
target_link_libraries(test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance device_grouped_convnd_bwd_weight_instance)
add_executable(test_grouped_convnd_bwd_weight_dataset_xdl test_grouped_convnd_bwd_weight_dataset_xdl.cpp)
target_compile_options(test_grouped_convnd_bwd_weight_dataset_xdl PRIVATE -Wno-global-constructors -Wno-undef)
target_link_libraries(test_grouped_convnd_bwd_weight_dataset_xdl PRIVATE gtest_main getopt::getopt utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance device_grouped_convnd_bwd_weight_instance)
elseif(DL_KERNELS)
add_gtest_executable(test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight.cpp)
target_link_libraries(test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance)

View File

@@ -0,0 +1,258 @@
// Copyright (c) Advanced Micro Devices, Inc., or its affiliates.
// SPDX-License-Identifier: MIT
#include <cstdlib> // Standard C library (exit codes, malloc)
#include <iostream> // C++ I/O streams (cout, cerr)
#include <initializer_list> // C++ initializer list support (unused here)
#include <vector> // C++ vector container - stores test cases
#include <string> // String operations
#include <gtest/gtest.h> // Google Test framework - provides TEST_P, INSTANTIATE_TEST_SUITE_P
#include "ck/utility/common_header.hpp"
#include "ck/tensor_operation/gpu/device/tensor_layout.hpp"
#include "ck/host_utility/device_prop.hpp"
#include "profiler/profile_grouped_conv_bwd_weight_impl.hpp" // The actual GPU profiler that does convolution work
#include "../common/csv_test_loader.hpp" // Shared CSV test case loader
using namespace ck::tensor_layout::convolution;
// Load CSV data for 2D tests
static std::vector<ck::utils::conv::ConvParam> Get2DTestCases()
{
static std::vector<ck::utils::conv::ConvParam> test_cases;
if(test_cases.empty())
{
std::string test_data_dir = ck::test::GetTestDataPath();
if(test_data_dir.empty())
{
std::cerr << "FATAL: test_data directory not found" << std::endl;
return test_cases;
}
std::vector<std::string> csv_paths = {test_data_dir + "/conv_test_set_2d_dataset.csv"};
bool loaded = ck::test::load_and_populate_test_cases(csv_paths, test_cases, "2D");
if(!loaded)
{
std::cerr << "FATAL: Failed to load 2D test cases from " << csv_paths[0] << std::endl;
}
}
return test_cases;
}
// Load CSV data for 3D tests
static std::vector<ck::utils::conv::ConvParam> Get3DTestCases()
{
static std::vector<ck::utils::conv::ConvParam> test_cases;
if(test_cases.empty())
{
std::string test_data_dir = ck::test::GetTestDataPath();
if(test_data_dir.empty())
{
std::cerr << "FATAL: test_data directory not found" << std::endl;
return test_cases;
}
std::vector<std::string> csv_paths = {test_data_dir + "/conv_test_set_3d_dataset.csv"};
bool loaded = ck::test::load_and_populate_test_cases(csv_paths, test_cases, "3D");
if(!loaded)
{
std::cerr << "FATAL: Failed to load 3D test cases from " << csv_paths[0] << std::endl;
}
}
return test_cases;
}
// Helper template to run a single backward weight convolution test
template <ck::index_t NDimSpatial,
typename InLayout,
typename WeiLayout,
typename OutLayout,
typename InDataType,
typename WeiDataType,
typename OutDataType>
bool RunConvBwdWeightTest(const ck::utils::conv::ConvParam& param, ck::index_t split_k)
{
return ck::profiler::profile_grouped_conv_bwd_weight_impl<NDimSpatial,
InLayout,
WeiLayout,
OutLayout,
InDataType,
WeiDataType,
OutDataType>(
true, // do_verification
1, // init_method
false, // do_log
false, // time_kernel
param, // ConvParam
std::to_string(split_k), // Split-K value as string
-1); // instance_index
}
// 2D Tests - NHWGK layout - Float - SplitK=1
class TestGroupedConvndBwdWeight2dNHWGKFloatSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight2dNHWGKFloatSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<2, NHWGC, GKYXC, NHWGK, float, float, float>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight2dNHWGKFloatSplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - Float - SplitK=2
class TestGroupedConvndBwdWeight2dNHWGKFloatSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight2dNHWGKFloatSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<2, NHWGC, GKYXC, NHWGK, float, float, float>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight2dNHWGKFloatSplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - Half - SplitK=1
class TestGroupedConvndBwdWeight2dNHWGKHalfSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight2dNHWGKHalfSplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<2, NHWGC, GKYXC, NHWGK, ck::half_t, ck::half_t, ck::half_t>(
GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight2dNHWGKHalfSplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - Half - SplitK=2
class TestGroupedConvndBwdWeight2dNHWGKHalfSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight2dNHWGKHalfSplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<2, NHWGC, GKYXC, NHWGK, ck::half_t, ck::half_t, ck::half_t>(
GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight2dNHWGKHalfSplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - BFloat16 - SplitK=1
class TestGroupedConvndBwdWeight2dNHWGKBFloat16SplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight2dNHWGKBFloat16SplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<2, NHWGC, GKYXC, NHWGK, ck::bhalf_t, float, ck::bhalf_t>(
GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight2dNHWGKBFloat16SplitK1,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - NHWGK layout - BFloat16 - SplitK=2
class TestGroupedConvndBwdWeight2dNHWGKBFloat16SplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight2dNHWGKBFloat16SplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<2, NHWGC, GKYXC, NHWGK, ck::bhalf_t, float, ck::bhalf_t>(
GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight2dNHWGKBFloat16SplitK2,
::testing::ValuesIn(Get2DTestCases()));
// 3D Tests - NDHWGK layout - Float - SplitK=1
class TestGroupedConvndBwdWeight3dNDHWGKFloatSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight3dNDHWGKFloatSplitK1, ConvTest)
{
EXPECT_TRUE(
(RunConvBwdWeightTest<3, NDHWGC, GKZYXC, NDHWGK, float, float, float>(GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight3dNDHWGKFloatSplitK1,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - Float - SplitK=2
class TestGroupedConvndBwdWeight3dNDHWGKFloatSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight3dNDHWGKFloatSplitK2, ConvTest)
{
EXPECT_TRUE(
(RunConvBwdWeightTest<3, NDHWGC, GKZYXC, NDHWGK, float, float, float>(GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight3dNDHWGKFloatSplitK2,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - Half - SplitK=1
class TestGroupedConvndBwdWeight3dNDHWGKHalfSplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight3dNDHWGKHalfSplitK1, ConvTest)
{
EXPECT_TRUE(
(RunConvBwdWeightTest<3, NDHWGC, GKZYXC, NDHWGK, ck::half_t, ck::half_t, ck::half_t>(
GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight3dNDHWGKHalfSplitK1,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - Half - SplitK=2
class TestGroupedConvndBwdWeight3dNDHWGKHalfSplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight3dNDHWGKHalfSplitK2, ConvTest)
{
EXPECT_TRUE(
(RunConvBwdWeightTest<3, NDHWGC, GKZYXC, NDHWGK, ck::half_t, ck::half_t, ck::half_t>(
GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight3dNDHWGKHalfSplitK2,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - BFloat16 - SplitK=1
class TestGroupedConvndBwdWeight3dNDHWGKBFloat16SplitK1
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight3dNDHWGKBFloat16SplitK1, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<3, NDHWGC, GKZYXC, NDHWGK, ck::bhalf_t, float, ck::bhalf_t>(
GetParam(), 1)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight3dNDHWGKBFloat16SplitK1,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - NDHWGK layout - BFloat16 - SplitK=2
class TestGroupedConvndBwdWeight3dNDHWGKBFloat16SplitK2
: public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndBwdWeight3dNDHWGKBFloat16SplitK2, ConvTest)
{
EXPECT_TRUE((RunConvBwdWeightTest<3, NDHWGC, GKZYXC, NDHWGK, ck::bhalf_t, float, ck::bhalf_t>(
GetParam(), 2)));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndBwdWeight3dNDHWGKBFloat16SplitK2,
::testing::ValuesIn(Get3DTestCases()));

View File

@@ -5,330 +5,165 @@
#include <iostream> // C++ I/O streams (cout, cerr)
#include <initializer_list> // C++ initializer list support (unused here)
#include <vector> // C++ vector container - stores test cases
#include <fstream> // File I/O for CSV reading
#include <sstream> // String stream for CSV parsing
#include <string> // String operations
#include <gtest/gtest.h> // Google Test framework - provides TYPED_TEST, EXPECT_TRUE
#include <gtest/gtest.h> // Google Test framework - provides TEST_P, INSTANTIATE_TEST_SUITE_P
#include "profiler/profile_grouped_conv_fwd_impl.hpp" // The actual GPU profiler that does convolution work
// CSV Reader Function for Loading Test Cases
// Reads convolution parameters from CSV file and returns vector of ConvParam structures
std::vector<ck::utils::conv::ConvParam> load_csv_test_cases(const std::string& filename)
{
std::vector<ck::utils::conv::ConvParam> conv_params; // Return vector
std::ifstream file(filename); // Open CSV file
if(!file.is_open())
{
std::cerr << "ERROR: Cannot open CSV file: " << filename << std::endl;
return conv_params; // Return empty vector on error
}
std::string line;
int line_number = 0;
// Read file line by line
while(std::getline(file, line))
{
line_number++;
// Skip comment lines (starting with #) and empty lines
if(line.empty() || line[0] == '#')
{
continue;
}
// Skip header line (contains column names)
if(line.find("NDim,Groups,BatchSize") != std::string::npos)
{
continue;
}
// Parse CSV line using stringstream
std::stringstream ss(line);
std::string cell;
std::vector<std::string> row;
// Split line by commas
while(std::getline(ss, cell, ','))
{
row.push_back(cell);
}
// Validate row has correct number of columns
if(row.size() < 19)
{ // Need at least 19 columns for 2D (excluding TestName)
std::cerr << "WARNING: Line " << line_number << " has insufficient columns ("
<< row.size() << "), skipping" << std::endl;
continue;
}
try
{
// Parse CSV data into ConvParam structure
// CSV Format:
// NDim,Groups,BatchSize,OutChannels,InChannels,KernelH,KernelW,InputH,InputW,OutputH,OutputW,StrideH,StrideW,DilationH,DilationW,LeftPadH,LeftPadW,RightPadH,RightPadW,TestName
int NDim = std::stoi(row[0]);
int Groups = std::stoi(row[1]);
int BatchSize = std::stoi(row[2]);
int OutChannels = std::stoi(row[3]);
int InChannels = std::stoi(row[4]);
if(NDim == 2)
{
// 2D Convolution: {NDim, Groups, BatchSize, OutChannels, InChannels,
// {KernelH,KernelW}, {InputH,InputW}, {StrideH,StrideW}, {DilationH,DilationW},
// {LeftPadH,LeftPadW}, {RightPadH,RightPadW}}
ck::utils::conv::ConvParam param = {
NDim, // NDim = 2
Groups, // Groups
BatchSize, // Batch size
OutChannels, // Output channels
InChannels, // Input channels
{std::stoi(row[5]), std::stoi(row[6])}, // Kernel: {H, W}
{std::stoi(row[7]), std::stoi(row[8])}, // Input: {H, W}
{std::stoi(row[11]), std::stoi(row[12])}, // Stride: {H, W}
{std::stoi(row[13]), std::stoi(row[14])}, // Dilation: {H, W}
{std::stoi(row[15]), std::stoi(row[16])}, // Left pad: {H, W}
{std::stoi(row[17]), std::stoi(row[18])} // Right pad: {H, W}
};
conv_params.push_back(param);
}
else if(NDim == 3)
{
// 3D Convolution: Need more columns for 3D parameters
if(row.size() < 26)
{
std::cerr << "WARNING: 3D convolution on line " << line_number
<< " needs 26+ columns, has " << row.size() << ", skipping"
<< std::endl;
continue;
}
// 3D Convolution: {NDim, Groups, BatchSize, OutChannels, InChannels,
// {KernelD,KernelH,KernelW}, {InputD,InputH,InputW}, {OutputD,OutputH,OutputW},
// {StrideD,StrideH,StrideW}, {DilationD,DilationH,DilationW},
// {LeftPadD,LeftPadH,LeftPadW}, {RightPadD,RightPadH,RightPadW}}
ck::utils::conv::ConvParam param = {
NDim, // NDim = 3
Groups, // Groups
BatchSize, // Batch size
OutChannels, // Output channels
InChannels, // Input channels
{std::stoi(row[5]), std::stoi(row[6]), std::stoi(row[7])}, // Kernel: {D, H, W}
{std::stoi(row[8]), std::stoi(row[9]), std::stoi(row[10])}, // Input: {D, H, W}
{std::stoi(row[14]),
std::stoi(row[15]),
std::stoi(row[16])}, // Stride: {D, H, W}
{std::stoi(row[17]),
std::stoi(row[18]),
std::stoi(row[19])}, // Dilation: {D, H, W}
{std::stoi(row[20]),
std::stoi(row[21]),
std::stoi(row[22])}, // Left pad: {D, H, W}
{std::stoi(row[23]),
std::stoi(row[24]),
std::stoi(row[25])} // Right pad: {D, H, W}
};
conv_params.push_back(param);
}
else
{
std::cerr << "WARNING: Unsupported NDim=" << NDim << " on line " << line_number
<< ", skipping" << std::endl;
}
}
catch(const std::exception& e)
{
std::cerr << "ERROR: Failed to parse line " << line_number << ": " << e.what()
<< std::endl;
continue;
}
}
file.close();
std::cout << "Loaded " << conv_params.size() << " test cases from " << filename << std::endl;
return conv_params;
}
// Template class that works with different data types and tensor layouts
template <typename Tuple>
class TestGroupedConvndFwd : public ::testing::Test // Inherit from Google Test base class
{
protected:
using DataType =
std::tuple_element_t<0, Tuple>; // Extract data type from tuple (fp32, fp16, bf16, int8)
using InLayout =
std::tuple_element_t<1, Tuple>; // Extract input tensor layout (NHWGC, NDHWGC, etc.)
using WeiLayout =
std::tuple_element_t<2, Tuple>; // Extract weight tensor layout (GKYXC, GKZYXC, etc.)
using OutLayout =
std::tuple_element_t<3, Tuple>; // Extract output tensor layout (NHWGK, NDHWGK, etc.)
using IndexType = ck::long_index_t; // 64-bit integer type for tensor dimensions
// THE KEY CONTAINER: This stores all test case parameters
// Each test will push_back() ConvParam structures here
std::vector<ck::utils::conv::ConvParam> conv_params;
// Template function to run tests for N-dimensional spatial convolution (2D or 3D)
template <ck::index_t NDimSpatial>
void Run()
{
EXPECT_FALSE(conv_params.empty()); // Google Test assertion: ensure we have test cases
bool pass = true; // Track overall pass/fail across all test cases
// MAIN LOOP: Execute every test case that was added to conv_params
for(auto& param : conv_params)
{
// CALL THE ACTUAL GPU PROFILER - This is where convolution happens!
pass = pass &&
ck::profiler::profile_grouped_conv_fwd_impl<NDimSpatial,
InLayout, // Input tensor layout
WeiLayout, // Weight tensor layout
OutLayout, // Output tensor layout
DataType, // Input data type
DataType, // Weight data type
DataType, // Output data type
DataType, // Accumulation type
DataType, // Bias type
IndexType>( // Index type (int64)
true, // do_verification: Compare GPU result with CPU reference
1, // init_method: How to initialize random test data (1 = uniform -5 to 5)
false, // do_log: Don't print detailed tensor values
false, // time_kernel: Don't do performance timing (just correctness)
param); // ConvParam: {NDim, Groups, Batch, OutChannels, InChannels,
// KernelSize, InputSize, ...}
}
EXPECT_TRUE(pass); // Google Test assertion: ALL test cases must pass
}
};
#include "../common/csv_test_loader.hpp" // Shared CSV test case loader
using namespace ck::tensor_layout::convolution; // Import tensor layout names (NHWGC, GKYXC, etc.)
// GOOGLE TEST TYPE COMBINATIONS: Define what data types and layouts to test
// This creates 4 separate test instances for 2D convolution:
using KernelTypes2d =
::testing::Types<std::tuple<float, NHWGC, GKYXC, NHWGK>, // fp32 test
std::tuple<ck::half_t, NHWGC, GKYXC, NHWGK>, // fp16 test
std::tuple<ck::bhalf_t, NHWGC, GKYXC, NHWGK>, // bfloat16 test
std::tuple<int8_t, NHWGC, GKYXC, NHWGK>>; // int8 test
// This creates 3 separate test instances for 3D convolution (no int8 support for 3D):
using KernelTypes3d =
::testing::Types<std::tuple<float, NDHWGC, GKZYXC, NDHWGK>, // fp32 3D test
std::tuple<ck::half_t, NDHWGC, GKZYXC, NDHWGK>, // fp16 3D test
std::tuple<ck::bhalf_t, NDHWGC, GKZYXC, NDHWGK>>; // bfloat16 3D test
// Create specialized test classes that inherit from the base template class
template <typename Tuple>
class TestGroupedConvndFwd2d : public TestGroupedConvndFwd<Tuple> // 2D convolution test class
// Load CSV data for 2D tests
static std::vector<ck::utils::conv::ConvParam> Get2DTestCases()
{
};
template <typename Tuple>
class TestGroupedConvndFwd3d : public TestGroupedConvndFwd<Tuple> // 3D convolution test class
{
};
// GOOGLE TEST MAGIC: Create test suites
// This tells Google Test to create 4 test instances for 2D (fp32, fp16, bf16, int8)
TYPED_TEST_SUITE(TestGroupedConvndFwd2d, KernelTypes2d);
// This tells Google Test to create 3 test instances for 3D (fp32, fp16, bf16)
TYPED_TEST_SUITE(TestGroupedConvndFwd3d, KernelTypes3d);
// THE ACTUAL 2D TEST - This runs 4 times (once for each data type: fp32, fp16, bf16, int8)
TYPED_TEST(TestGroupedConvndFwd2d, Test2D)
{
// LOAD TEST CASES FROM CSV FILE instead of hardcoded cases
// Try different locations for the CSV file (build directory vs source directory)
std::vector<std::string> csv_paths = {
"../test_data/conv_test_set_2d_dataset.csv", // From build directory to source
};
bool loaded = false;
for(const auto& csv_path : csv_paths)
static std::vector<ck::utils::conv::ConvParam> test_cases;
if(test_cases.empty())
{
auto csv_cases = load_csv_test_cases(csv_path);
if(!csv_cases.empty())
std::string test_data_dir = ck::test::GetTestDataPath();
if(test_data_dir.empty())
{
// Successfully loaded CSV data - add all test cases to conv_params
for(const auto& test_case : csv_cases)
{
this->conv_params.push_back(test_case);
}
std::cout << "Loaded " << csv_cases.size() << " 2D test cases from " << csv_path
<< std::endl;
loaded = true;
break;
std::cerr << "FATAL: test_data directory not found" << std::endl;
return test_cases;
}
std::vector<std::string> csv_paths = {test_data_dir + "/conv_test_set_2d_dataset.csv"};
bool loaded = ck::test::load_and_populate_test_cases(csv_paths, test_cases, "2D");
if(!loaded)
{
std::cerr << "FATAL: Failed to load 2D test cases from " << csv_paths[0] << std::endl;
}
}
// FAIL if CSV loading fails - no fallback!
if(!loaded)
{
std::cerr << "ERROR: Failed to load CSV test data from any of these locations:"
<< std::endl;
for(const auto& path : csv_paths)
{
std::cerr << " - " << path << std::endl;
}
std::cerr << "\nPlease ensure CSV test data exists in one of these locations." << std::endl;
std::cerr << "Run generate_test_dataset.sh in test_data/ to create test datasets."
<< std::endl;
// Force test failure - no test cases means test should fail
EXPECT_TRUE(loaded) << "CSV test data loading failed";
}
// Execute all test cases with 2D convolution
// This calls Run<2>() which loops through conv_params and calls GPU profiler for each
this->template Run<2>();
return test_cases;
}
// THE ACTUAL 3D TEST - This runs 3 times (once for each data type: fp32, fp16, bf16)
TYPED_TEST(TestGroupedConvndFwd3d, Test3D)
// Load CSV data for 3D tests
static std::vector<ck::utils::conv::ConvParam> Get3DTestCases()
{
// LOAD TEST CASES FROM CSV FILE instead of hardcoded cases
// Try different locations for the CSV file (build directory vs source directory)
std::vector<std::string> csv_paths = {
"../test_data/conv_test_set_3d_dataset.csv", // From build directory to source
};
bool loaded = false;
for(const auto& csv_path : csv_paths)
static std::vector<ck::utils::conv::ConvParam> test_cases;
if(test_cases.empty())
{
auto csv_cases = load_csv_test_cases(csv_path);
if(!csv_cases.empty())
std::string test_data_dir = ck::test::GetTestDataPath();
if(test_data_dir.empty())
{
// Successfully loaded CSV data - add all test cases to conv_params
for(const auto& test_case : csv_cases)
{
this->conv_params.push_back(test_case);
}
std::cout << "Loaded " << csv_cases.size() << " 3D test cases from " << csv_path
<< std::endl;
loaded = true;
break;
std::cerr << "FATAL: test_data directory not found" << std::endl;
return test_cases;
}
std::vector<std::string> csv_paths = {test_data_dir + "/conv_test_set_3d_dataset.csv"};
bool loaded = ck::test::load_and_populate_test_cases(csv_paths, test_cases, "3D");
if(!loaded)
{
std::cerr << "FATAL: Failed to load 3D test cases from " << csv_paths[0] << std::endl;
}
}
// FAIL if CSV loading fails - no fallback!
if(!loaded)
{
std::cerr << "ERROR: Failed to load CSV test data from any of these locations:"
<< std::endl;
for(const auto& path : csv_paths)
{
std::cerr << " - " << path << std::endl;
}
std::cerr << "\nPlease ensure CSV test data exists in one of these locations." << std::endl;
std::cerr << "Run generate_test_dataset.sh in test_data/ to create test datasets."
<< std::endl;
// Force test failure - no test cases means test should fail
EXPECT_TRUE(loaded) << "CSV test data loading failed";
}
// Execute all test cases with 3D convolution
// This calls Run<3>() which loops through conv_params and calls GPU profiler for each
this->template Run<3>();
return test_cases;
}
// Helper template to run a single convolution test
template <ck::index_t NDimSpatial,
typename InLayout,
typename WeiLayout,
typename OutLayout,
typename DataType>
bool RunConvTest(const ck::utils::conv::ConvParam& param)
{
using IndexType = ck::long_index_t;
return ck::profiler::profile_grouped_conv_fwd_impl<NDimSpatial,
InLayout,
WeiLayout,
OutLayout,
DataType,
DataType,
DataType,
DataType,
DataType,
IndexType>(true, // do_verification
1, // init_method
false, // do_log
false, // time_kernel
param);
}
// 2D Tests - Float
class TestGroupedConvndFwd2dFloat : public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndFwd2dFloat, ConvTest)
{
EXPECT_TRUE((RunConvTest<2, NHWGC, GKYXC, NHWGK, float>(GetParam())));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndFwd2dFloat,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - Half
class TestGroupedConvndFwd2dHalf : public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndFwd2dHalf, ConvTest)
{
EXPECT_TRUE((RunConvTest<2, NHWGC, GKYXC, NHWGK, ck::half_t>(GetParam())));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndFwd2dHalf,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - BFloat16
class TestGroupedConvndFwd2dBFloat16 : public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndFwd2dBFloat16, ConvTest)
{
EXPECT_TRUE((RunConvTest<2, NHWGC, GKYXC, NHWGK, ck::bhalf_t>(GetParam())));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndFwd2dBFloat16,
::testing::ValuesIn(Get2DTestCases()));
// 2D Tests - Int8
class TestGroupedConvndFwd2dInt8 : public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndFwd2dInt8, ConvTest)
{
EXPECT_TRUE((RunConvTest<2, NHWGC, GKYXC, NHWGK, int8_t>(GetParam())));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndFwd2dInt8,
::testing::ValuesIn(Get2DTestCases()));
// 3D Tests - Float
class TestGroupedConvndFwd3dFloat : public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndFwd3dFloat, ConvTest)
{
EXPECT_TRUE((RunConvTest<3, NDHWGC, GKZYXC, NDHWGK, float>(GetParam())));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndFwd3dFloat,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - Half
class TestGroupedConvndFwd3dHalf : public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndFwd3dHalf, ConvTest)
{
EXPECT_TRUE((RunConvTest<3, NDHWGC, GKZYXC, NDHWGK, ck::half_t>(GetParam())));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndFwd3dHalf,
::testing::ValuesIn(Get3DTestCases()));
// 3D Tests - BFloat16
class TestGroupedConvndFwd3dBFloat16 : public ::testing::TestWithParam<ck::utils::conv::ConvParam>
{
};
TEST_P(TestGroupedConvndFwd3dBFloat16, ConvTest)
{
EXPECT_TRUE((RunConvTest<3, NDHWGC, GKZYXC, NDHWGK, ck::bhalf_t>(GetParam())));
}
INSTANTIATE_TEST_SUITE_P(Dataset,
TestGroupedConvndFwd3dBFloat16,
::testing::ValuesIn(Get3DTestCases()));