mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-19 12:30:16 +00:00
* Add optimized blockwise gemm using ck wrapper
* Add basic gemm example
* Update docs
* Add tutorial for gemm using ck wrapper
* Add perf note
* edits
* Fix cmake
* Fixes
---------
Co-authored-by: Lisa Delaney <lisa.delaney@amd.com>
[ROCm/composable_kernel commit: 1e73adbc28]
13 lines
890 B
CMake
13 lines
890 B
CMake
# Build the client_tensor_transform_using_wrapper executable from
# tensor_transform_using_wrapper.cpp and link it privately against the
# composable_kernel::device_other_operations target.
add_executable(
    client_tensor_transform_using_wrapper
    tensor_transform_using_wrapper.cpp
)
target_link_libraries(
    client_tensor_transform_using_wrapper
    PRIVATE composable_kernel::device_other_operations
)
|
|
# Build the client_wrapper_img2col executable from wrapper_img2col.cpp and
# link it privately against composable_kernel::device_other_operations.
add_executable(
    client_wrapper_img2col
    wrapper_img2col.cpp
)
target_link_libraries(
    client_wrapper_img2col
    PRIVATE composable_kernel::device_other_operations
)
|
|
# The wrapper GEMM examples are only added when GPU_TARGETS matches at least
# one of gfx908, gfx90a, gfx940, gfx941 or gfx942.
# NOTE(review): presumably these examples depend on hardware features that
# only those architectures provide -- confirm against the example sources.
if(GPU_TARGETS MATCHES "gfx908"
   OR GPU_TARGETS MATCHES "gfx90a"
   OR GPU_TARGETS MATCHES "gfx940"
   OR GPU_TARGETS MATCHES "gfx941"
   OR GPU_TARGETS MATCHES "gfx942")

    # Basic GEMM example built from wrapper_basic_gemm.cpp.
    add_executable(
        client_wrapper_basic_gemm
        wrapper_basic_gemm.cpp
    )
    target_link_libraries(
        client_wrapper_basic_gemm
        PRIVATE composable_kernel::device_other_operations
    )

    # Optimized GEMM example built from wrapper_optimized_gemm.cpp.
    add_executable(
        client_wrapper_optimized_gemm
        wrapper_optimized_gemm.cpp
    )
    target_link_libraries(
        client_wrapper_optimized_gemm
        PRIVATE composable_kernel::device_other_operations
    )
endif()
|