Files
blis/addon/CMakeLists.txt
Balasubramanian, Vignesh 73911d5990 Updates to the build systems(CMake and Make) for LPGEMM compilation (#303)
- The current build systems have the following behaviour
  with regards to building "aocl_gemm" addon codebase(LPGEMM)
  when giving "amdzen" as the target architecture(fat-binary)
  - Make:  Attempts to compile LPGEMM kernels using the same
                compiler flags that the makefile fragments set for BLIS
                kernels, based on the compiler version.
  - CMake: With presets, it always enables the addon compilation
                 unless explicitly specified with the ENABLE_ADDON variable.

- This poses a bug with older compilers, owing to them not supporting
  BF16 or INT8 intrinsic compilation.

- This patch adds the functionality to check for GCC and Clang compiler versions,
  and disables LPGEMM compilation if GCC < 11.2 or Clang < 12.0.

- Make:  Updated the configure script to check for the compiler version
              if the addon is specified.
  CMake: Updated the main CMakeLists.txt to check for the compiler version
               if the addon is specified, and to also force-update the associated
               cache variable update. Also updated kernels/CMakeLists.txt to
               check if "aocl_gemm" remains in the ENABLE_ADDONS list after
               all the checks in the previous layers.

AMD-Internal: [CPUPL-7850]

Signed-off by : Vignesh Balasubramanian <Vignesh.Balasubramanian@amd.com>
2026-01-16 19:39:55 +05:30

237 lines
12 KiB
CMake

#[=[
BLIS
An object-based framework for developing high-performance BLAS-like
libraries.
Copyright (C) 2023 - 2025, Advanced Micro Devices, Inc. All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are
met:
- Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.
- Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in the
documentation and/or other materials provided with the distribution.
- Neither the name(s) of the copyright holder(s) nor the names of its
contributors may be used to endorse or promote products derived
from this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
]=]
# Writing a function that will be used to generate the required object
# libraries for the required addons.
function(generate_addon_targets addon_target)
# Collect all subdirectory paths that have at least one file with suffix in ADDON_C99_SUFS list.
get_filepaths_with_suffixes(LOCAL_SOURCE_C99_FILES "${CMAKE_CURRENT_SOURCE_DIR}/${addon_target}" "${ADDON_C99_SUFS}")
# We want to break the files above in 2 categories, files in kernel directory and the rest.
# Only list files in kernel directory.
set(LOCAL_KERNEL_FILES_C99 ${LOCAL_SOURCE_FILES})
list(FILTER LOCAL_KERNEL_FILES_C99 INCLUDE REGEX ${addon_target}/kernels/)
# All C99 files, except of the ones in kernels directory.
list(REMOVE_ITEM LOCAL_SOURCE_C99_FILES ${LOCAL_KERNEL_FILES_C99})
# Collect all subdirectory paths that have at least one file with suffix in ADDON_H99_SUFS list.
get_dirpaths_with_suffixes(CADDONINCFLAGS "${CMAKE_CURRENT_SOURCE_DIR}/${addon_target}" "${ADDON_H99_SUFS}")
# Only generate the object library if there is at least one source file.
list(LENGTH LOCAL_SOURCE_C99_FILES size)
if(size GREATER 0)
# Create an object library using the source file list above.
add_library(${addon_target}_C99_ADDON
OBJECT
${LOCAL_SOURCE_C99_FILES}
)
# Include the corresponding make_defs.cmake that holds the required compiler options.
include(${PROJECT_SOURCE_DIR}/config/${BLIS_CONFIG_FAMILY}/make_defs.cmake)
# Use PRIVATE keyword for option setting since we do not want the properties to propagate in other targets.
# mimicing get-addon-c99flags-for
target_compile_options(${addon_target}_C99_ADDON
PRIVATE
# load-var-for,COPTFLAGS
${COPTFLAGS}
# get-noopt-cflags-for
${CDBGFLAGS}
# get-noopt-cflags-for
${CWARNFLAGS}
# get-noopt-cflags-for
${CMISCFLAGS}
# get-noopt-cflags-for
${CLANGFLAGS}
# in get-addon-c99flags-for
${BUILD_SYMFLAGS}
)
target_compile_definitions(${addon_target}_C99_ADDON
PRIVATE
# in get-noopt-cflags-for
${CPPROCFLAGS}
# in get-noopt-cflags-for
${VERS_DEF}
# in get-addon-c99flags-for
${BUILD_CPPFLAGS}
)
target_include_directories(${addon_target}_C99_ADDON
BEFORE
PRIVATE
# in get-noopt-cflags-for
${CINFLAGS}
# in get-addon-c99flags-for
${CADDONINCFLAGS}
)
if(THREADING_MODEL STREQUAL "openmp")
# Equivalent to CTHREADFLAGS in get-noopt-cflags-for
target_link_libraries(${addon_target}_C99_ADDON PRIVATE OpenMP::OpenMP_C)
elseif(THREADING_MODEL STREQUAL "pthreads")
# in get-noopt-cflags-for
target_compile_options(${addon_target}_C99_ADDON PRIVATE ${CTHREADFLAGS})
endif()
# Equivalent to CPICFLAGS in get-noopt-cflags-for
set_target_properties(${addon_target}_C99_ADDON PROPERTIES POSITION_INDEPENDENT_CODE ON)
add_dependencies(${addon_target}_C99_ADDON flat-header)
# Put all those targets under object-libs-targets folder name so that they appear all together in IDE.
set_target_properties(${addon_target}_C99_ADDON PROPERTIES FOLDER object-libs-targets)
endif()
# Only generate the object library if there is at least one source file.
list(LENGTH LOCAL_KERNEL_FILES_C99 size)
if(size GREATER 0)
# Create an object library using the kernel source file list above.
add_library(${addon_target}_C99_KERNEL_ADDON
OBJECT
${LOCAL_KERNEL_FILES_C99}
)
# Include the corresponding make_defs.cmake that holds the required compiler options.
include(${PROJECT_SOURCE_DIR}/config/${BLIS_CONFIG_FAMILY}/make_defs.cmake)
# Use PRIVATE keyword for option setting since we do not want the properties to propagate in other targets.
# mimicing get-addon-c99flags-for
target_compile_options(${addon_target}_C99_KERNEL_ADDON
PRIVATE
# load-var-for,CKOPTFLAGS
${CKOPTFLAGS}
# load-var-for,CKVECFLAGS
${CKVECFLAGS}
# get-noopt-cflags-for
${CDBGFLAGS}
# get-noopt-cflags-for
${CWARNFLAGS}
# get-noopt-cflags-for
${CMISCFLAGS}
# get-noopt-cflags-for
${CLANGFLAGS}
# in get-addon-kernel-c99flags-for
${BUILD_SYMFLAGS}
)
target_compile_definitions(${addon_target}_C99_KERNEL_ADDON
PRIVATE
# in get-noopt-cflags-for
${CPPROCFLAGS}
# in get-noopt-cflags-for
${VERS_DEF}
# in get-addon-kernel-c99flags-for
${BUILD_CPPFLAGS}
)
target_include_directories(${addon_target}_C99_KERNEL_ADDON
BEFORE
PRIVATE
# in get-noopt-cflags-for
${CINFLAGS}
# in get-addon-kernel-c99flags-for
${CADDONINCFLAGS}
)
if(THREADING_MODEL STREQUAL "openmp")
# Equivalent to CTHREADFLAGS in get-noopt-cflags-for
target_link_libraries(${addon_target}_C99_KERNEL_ADDON PRIVATE OpenMP::OpenMP_C)
elseif(THREADING_MODEL STREQUAL "pthreads")
# in get-noopt-cflags-for
target_compile_options(${addon_target}_C99_KERNEL_ADDON PRIVATE ${CTHREADFLAGS})
endif()
# Equivalent to CPICFLAGS in get-noopt-cflags-for
set_target_properties(${addon_target}_C99_KERNEL_ADDON PROPERTIES POSITION_INDEPENDENT_CODE ON)
add_dependencies(${addon_target}_C99_KERNEL_ADDON flat-header)
# Put all those targets under object-libs-targets folder name so that they appear all together in IDE.
set_target_properties(${addon_target}_C99_KERNEL_ADDON PROPERTIES FOLDER object-libs-targets)
endif()
# Note: C++ files (JIT code) are not collected here.
# The main CMakeLists.txt already filters out aocl_gemm addon for compilers
# that don't support BF16 intrinsics (GCC < 11.2, Clang < 12.0).
# For supported compilers, we only use C files with intrinsics, not JIT.
set(LOCAL_SOURCE_CXX_FILES "")
# Only generate the object library if there is at least one source file.
list(LENGTH LOCAL_SOURCE_CXX_FILES size)
if(size GREATER 0)
# Create an object library using the source file list above.
add_library(${addon_target}_CXX_ADDON
OBJECT
${LOCAL_SOURCE_CXX_FILES}
)
# Use PRIVATE keyword for option setting since we do not want the properties to propagate in other targets.
# mimicing get-addon-cxxflags-for
target_compile_options(${addon_target}_CXX_ADDON
PRIVATE
# load-var-for,COPTFLAGS
${COPTFLAGS}
# get-noopt-cxxflags-for
${CDBGFLAGS}
# get-noopt-cxxflags-for
${CWARNFLAGS}
# get-noopt-cxxflags-for
${CMISCFLAGS}
# get-noopt-cxxflags-for
${CXXLANGFLAGS}
# in get-addon-cxxflags-for
${BUILD_SYMFLAGS}
)
target_compile_definitions(${addon_target}_CXX_ADDON
PRIVATE
# in get-noopt-cflags-for
${CPPROCFLAGS}
# in get-noopt-cflags-for
${VERS_DEF}
# in get-addon-cxxflags-for
${BUILD_CPPFLAGS}
)
target_include_directories(${addon_target}_CXX_ADDON
BEFORE
PRIVATE
# in get-noopt-cflags-for
${CINFLAGS}
# in get-addon-cxxflags-for
${CADDONINCFLAGS}
)
if(THREADING_MODEL STREQUAL "openmp")
# Equivalent to CTHREADFLAGS in get-noopt-cflags-for
target_link_libraries(${addon_target}_CXX_ADDON PRIVATE OpenMP::OpenMP_C)
elseif(THREADING_MODEL STREQUAL "pthreads")
# in get-noopt-cflags-for
target_compile_options(${addon_target}_CXX_ADDON PRIVATE ${CTHREADFLAGS})
endif()
# Equivalent to CPICFLAGS in get-noopt-cflags-for
set_target_properties(${addon_target}_CXX_ADDON PROPERTIES POSITION_INDEPENDENT_CODE ON)
add_dependencies(${addon_target}_CXX_ADDON flat-header)
# Put all those targets under object-libs-targets folder name so that they appear all together in IDE.
set_target_properties(${addon_target}_CXX_ADDON PROPERTIES FOLDER object-libs-targets)
endif()
endfunction()
# Generate targets for each of the addons.
foreach(ADDON ${ENABLE_ADDON})
generate_addon_targets(${ADDON})
endforeach()