mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-21 21:39:15 +00:00
* enabled atomic add in tensor copy
* added gridwise GEMM
* added backward data conv using GEMM + atomic
* added backward data conv using GEMM, no atomic
[ROCm/composable_kernel commit: 8f5f64960e]
33 lines
993 B
CMake
33 lines
993 B
CMake
# Source files that make up the `host` library.
# Paths are relative to the directory containing this listfile.
set(TENSOR_SOURCE
    src/tensor.cpp
    src/device.cpp
)
|
|
|
|
# Shared library `host`, built from the files listed in TENSOR_SOURCE.
add_library(host SHARED ${TENSOR_SOURCE})

# NOTE(review): no compile features are named in this call, so as written it
# appears to add no requirements to `host` -- confirm whether a feature such
# as a C++ standard level was intended here.
target_compile_features(host PUBLIC)

# Build the library's objects as position-independent code.
set_property(TARGET host PROPERTY POSITION_INDEPENDENT_CODE ON)
|
|
|
|
# When configured for the NVIDIA backend, link `host` against the nvToolsExt
# and cudart libraries.
#
# The scope keyword is spelled out (instead of the legacy keyword-less
# signature) to match the other target_link_libraries() calls in this file.
# PUBLIC is used because the keyword-less signature made these dependencies
# transitive; PUBLIC keeps them visible to every target that links `host`.
if(DEVICE_BACKEND STREQUAL "NVIDIA")
    target_link_libraries(host PUBLIC nvToolsExt cudart)
endif()
|
|
|
|
# Install rule for `host`: its LIBRARY artifact goes to `lib`, interpreted
# relative to the install prefix.
install(
    TARGETS host
    LIBRARY DESTINATION lib
)
|
|
|
|
|
|
# Choose the driver source files according to DEVICE_BACKEND:
#   AMD    -> the .cpp drivers
#   NVIDIA -> the .cu drivers
# The resulting CONV_SOURCE, COL2IM_SOURCE and CONV_BWD_DATA_SOURCE variables
# are consumed by the add_executable() calls that follow.
if(DEVICE_BACKEND STREQUAL "AMD")
    set(CONV_SOURCE src/conv_driver.cpp)
    set(COL2IM_SOURCE src/col2im_driver.cpp)
    set(CONV_BWD_DATA_SOURCE src/conv_bwd_data_driver.cpp)
elseif(DEVICE_BACKEND STREQUAL "NVIDIA")
    set(CONV_SOURCE src/conv_driver.cu)
    set(COL2IM_SOURCE src/col2im_driver.cu)
    set(CONV_BWD_DATA_SOURCE src/conv_bwd_data_driver.cu)
else()
    # Fail early with a clear message: otherwise none of the *_SOURCE
    # variables is set here and the driver executables would be declared
    # without any source files.
    message(FATAL_ERROR
        "Unsupported DEVICE_BACKEND \"${DEVICE_BACKEND}\": expected \"AMD\" or \"NVIDIA\".")
endif()
|
|
|
|
# Driver executables. Each one is built from its backend-specific source
# variable and links privately against the `host` library.

# conv
add_executable(conv ${CONV_SOURCE})
target_link_libraries(conv PRIVATE host)

# col2im
add_executable(col2im ${COL2IM_SOURCE})
target_link_libraries(col2im PRIVATE host)

# conv_bwd_data
add_executable(conv_bwd_data ${CONV_BWD_DATA_SOURCE})
target_link_libraries(conv_bwd_data PRIVATE host)
|