Mirror of https://github.com/ROCm/composable_kernel.git (synced 2026-05-21 13:29:20 +00:00)
* Add optimized blockwise gemm using ck wrapper
* Add basic gemm example
* Update docs
* Add tutorial for gemm using ck wrapper
* Add perf note
* edits
* Fix cmake
* Fixes
---------
Co-authored-by: Lisa Delaney <lisa.delaney@amd.com>
[ROCm/composable_kernel commit: 1e73adbc28]
22 lines
1.1 KiB
CMake
# Aggregate target: building `test_wrapper` builds every wrapper test
# executable registered below through add_dependencies().
add_custom_target(test_wrapper)

# Each test follows the same three steps:
#   1. add_gtest_executable() - helper defined elsewhere in the project;
#      called here with the target name followed by its single source file.
#   2. target_link_libraries() - link the test privately against `utility`.
#   3. add_dependencies()      - attach the test to the aggregate target.

add_gtest_executable(test_wrapper_layout test_wrapper_layout.cpp)
target_link_libraries(test_wrapper_layout PRIVATE utility)
add_dependencies(test_wrapper test_wrapper_layout)

add_gtest_executable(test_wrapper_tensor test_wrapper_tensor.cpp)
target_link_libraries(test_wrapper_tensor PRIVATE utility)
add_dependencies(test_wrapper test_wrapper_tensor)

add_gtest_executable(test_wrapper_copy test_wrapper_copy.cpp)
target_link_libraries(test_wrapper_copy PRIVATE utility)
add_dependencies(test_wrapper test_wrapper_copy)

add_gtest_executable(test_wrapper_partition test_wrapper_partition.cpp)
target_link_libraries(test_wrapper_partition PRIVATE utility)
add_dependencies(test_wrapper test_wrapper_partition)

# The GEMM test is registered only when GPU_TARGETS contains at least one of
# gfx908, gfx90a, gfx940, gfx941 or gfx942 (MATCHES performs a regex search,
# so any occurrence inside the GPU_TARGETS value counts).
if(GPU_TARGETS MATCHES "gfx908" OR GPU_TARGETS MATCHES "gfx90a" OR
   GPU_TARGETS MATCHES "gfx940" OR GPU_TARGETS MATCHES "gfx941" OR
   GPU_TARGETS MATCHES "gfx942")
    add_gtest_executable(test_wrapper_gemm test_wrapper_gemm.cpp)
    target_link_libraries(test_wrapper_gemm PRIVATE utility)
    add_dependencies(test_wrapper test_wrapper_gemm)
endif()