mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-07-03 13:48:30 +00:00
Replace inline lambdas with named functor structs in transform_tensor_descriptor to reduce template instantiation overhead and improve compile times. Changes: - Add three named functors in tensor_descriptor.hpp: - convert_visible_to_hidden_id: maps visible dimension ID to hidden ID - convert_visible_ids_to_hidden_ids: maps sequence of visible IDs to hidden IDs - generate_arithmetic_sequence_from_scan: generates consecutive hidden dim ID ranges - Add utility functions in sequence_helper.hpp and tuple_helper.hpp: - unpack_and_merge_sequences(): unpacks tuple of sequences and merges them - generate_identity_sequences(): creates Tuple<Sequence<0>, Sequence<1>, ...> - Update 14 call sites across threadwise transfer, wrapper, and device files to use generate_identity_sequences() instead of generate_tuple with lambdas - Add comprehensive unit tests: - unit_sequence_helper.cpp: tests for new utility functions - unit_tensor_descriptor_functors.cpp: tests for new functors Co-Authored-By: Claude <noreply@anthropic.com>
66 lines
2.3 KiB
C++
66 lines
2.3 KiB
C++
// Copyright (c) Advanced Micro Devices, Inc., or its affiliates.
|
|
// SPDX-License-Identifier: MIT
|
|
|
|
#include <gtest/gtest.h>
|
|
#include "ck/utility/sequence_helper.hpp"
|
|
#include "ck/utility/tuple_helper.hpp"
|
|
|
|
using namespace ck;
|
|
|
|
// Tests for generate_identity_sequences (PR #3588)
|
|
TEST(GenerateIdentitySequences, Size5)
|
|
{
|
|
auto result = generate_identity_sequences(Number<5>{});
|
|
auto expected =
|
|
make_tuple(Sequence<0>{}, Sequence<1>{}, Sequence<2>{}, Sequence<3>{}, Sequence<4>{});
|
|
EXPECT_TRUE((is_same<decltype(result), decltype(expected)>::value));
|
|
}
|
|
|
|
TEST(GenerateIdentitySequences, Size1)
|
|
{
|
|
auto result = generate_identity_sequences(Number<1>{});
|
|
auto expected = make_tuple(Sequence<0>{});
|
|
EXPECT_TRUE((is_same<decltype(result), decltype(expected)>::value));
|
|
}
|
|
|
|
TEST(GenerateIdentitySequences, Size0)
|
|
{
|
|
auto result = generate_identity_sequences(Number<0>{});
|
|
auto expected = make_tuple();
|
|
EXPECT_TRUE((is_same<decltype(result), decltype(expected)>::value));
|
|
}
|
|
|
|
TEST(GenerateIdentitySequences, WithNumber)
|
|
{
|
|
constexpr auto result = generate_identity_sequences(Number<3>{});
|
|
EXPECT_EQ(result.Size(), 3);
|
|
EXPECT_TRUE((is_same<decltype(result.At(Number<0>{})), const Sequence<0>&>::value));
|
|
EXPECT_TRUE((is_same<decltype(result.At(Number<1>{})), const Sequence<1>&>::value));
|
|
EXPECT_TRUE((is_same<decltype(result.At(Number<2>{})), const Sequence<2>&>::value));
|
|
}
|
|
|
|
// Tests for unpack_and_merge_sequences (PR #3589)
|
|
TEST(UnpackAndMergeSequences, MergeMultipleSequences)
|
|
{
|
|
auto input = make_tuple(Sequence<1, 2>{}, Sequence<3, 4>{}, Sequence<5, 6>{});
|
|
auto result = unpack_and_merge_sequences(input);
|
|
auto expected = Sequence<1, 2, 3, 4, 5, 6>{};
|
|
EXPECT_TRUE((is_same<decltype(result), decltype(expected)>::value));
|
|
}
|
|
|
|
TEST(UnpackAndMergeSequences, SingleSequence)
|
|
{
|
|
auto input = make_tuple(Sequence<10, 20, 30>{});
|
|
auto result = unpack_and_merge_sequences(input);
|
|
auto expected = Sequence<10, 20, 30>{};
|
|
EXPECT_TRUE((is_same<decltype(result), decltype(expected)>::value));
|
|
}
|
|
|
|
TEST(UnpackAndMergeSequences, TwoSequences)
|
|
{
|
|
auto input = make_tuple(Sequence<100>{}, Sequence<200, 300>{});
|
|
auto result = unpack_and_merge_sequences(input);
|
|
auto expected = Sequence<100, 200, 300>{};
|
|
EXPECT_TRUE((is_same<decltype(result), decltype(expected)>::value));
|
|
}
|