mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-11 17:00:18 +00:00
* add a prototype of int4 * clean * debug * clean * clean * move packed into dynamic_buffer * fixed coord reset * add fast pki4 to half conversion * fix * fixed reference and host_tensor * fixed tensor init * format * debug i4_to_f16_convert * format * fixed splitk * weight permute * add b tile permute * clean * weight permute with splitki * format * improve weight layout * add and_or_b32 * fixed splitk crush * add permute switch as a template * recover v3r1 * clean * failure with intrawave v2 * fixed * fixed * add ckProfiler * add bfp16 support * add bf16 example * fixed int4 to bhalf_t conversion * format * fixed int4 to bf16 conversion * clean * add instances for mem * clean * fixed host tensor size * fixed * debug * fixed * add pk_i4_t as a struct * fix * Update example/01_gemm/gemm_xdl_bf16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update example/01_gemm/gemm_xdl_bf16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update example/01_gemm/gemm_xdl_bf16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * revert * Update example/01_gemm/gemm_xdl_bf16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update example/01_gemm/gemm_xdl_fp16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update example/01_gemm/gemm_xdl_fp16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update example/01_gemm/gemm_xdl_fp16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update example/01_gemm/gemm_xdl_fp16_pk_i4_v3.cpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * fixed comments * revert * clean * revert * revert * fixed * Update CMakeLists.txt * Update script/cmake-ck-dev.sh Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update 
include/ck/tensor_operation/gpu/element/unary_element_wise_operation.hpp Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * Update CMakeLists.txt Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com> * fixed * fixed * fixed * revert * revert * add comments * format * fixed assert * fixed * Fix I4 define in ckProfiler * Fixed example_gemm_xdl_bf16_pk_i4_v3 test failed issue --------- Co-authored-by: Jing Zhang <jizhan@fb.com> Co-authored-by: zjing14 <zhangjing14@gmail.com> Co-authored-by: mtgu0705 <mtgu@amd.com>
117 lines
4.3 KiB
CMake
117 lines
4.3 KiB
CMake
################################################################################
|
|
#
|
|
# MIT License
|
|
#
|
|
# Copyright (c) 2017-2024 Advanced Micro Devices, Inc.
|
|
#
|
|
# Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
# of this software and associated documentation files (the "Software"), to deal
|
|
# in the Software without restriction, including without limitation the rights
|
|
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
# copies of the Software, and to permit persons to whom the Software is
|
|
# furnished to do so, subject to the following conditions:
|
|
#
|
|
# The above copyright notice and this permission notice shall be included in all
|
|
# copies or substantial portions of the Software.
|
|
#
|
|
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
# SOFTWARE.
|
|
#
|
|
################################################################################
|
|
# - Enable a strict warning set for gcc/clang; on Visual Studio all warnings are currently suppressed with /w
|
|
|
|
## Strict warning level
|
|
# Configure compiler warning flags at directory scope.
#
# MSVC:
#   Appends /w to CMAKE_CXX_FLAGS and CMAKE_C_FLAGS.
# Any other compiler:
#   For each of the C and CXX languages, builds the list
#   CMAKE_COMPILER_WARNINGS (common flags + compiler-specific flags) and hands
#   it to add_definitions(). After the loop the variable holds the list that
#   was built for CXX.
if(MSVC)
    # NOTE: /w *disables* all MSVC warnings; it is not the highest warning
    # level (that would be /W4). The flag is kept as-is to preserve the
    # current build behaviour.
    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} /w")
    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /w")
else()
    foreach(COMPILER C CXX)
        # Warning flags shared by gcc and clang. The list is rebuilt from
        # scratch on every iteration.
        set(CMAKE_COMPILER_WARNINGS
            -Wall
            -Wextra
            -Wcomment
            -Wendif-labels
            -Wformat
            -Winit-self
            -Wreturn-type
            -Wsequence-point
            # -Wshadow is intentionally left out: it is broken on gcc when
            # using lambdas.
            -Wswitch
            -Wtrigraphs
            -Wundef
            -Wuninitialized
            -Wunreachable-code
            -Wunused
            -Wno-reserved-identifier
            # Warnings are promoted to errors unconditionally.
            -Werror
            -Wno-option-ignored
            -Wsign-compare
            -Wno-extra-semi-stmt
            -Wno-unused-template
        )

        if(CMAKE_${COMPILER}_COMPILER_ID MATCHES "Clang")
            # Clang: turn on every warning, then opt out of the ones listed
            # below.
            list(APPEND CMAKE_COMPILER_WARNINGS
                -Weverything
                -Wno-c++98-compat
                -Wno-c++98-compat-pedantic
                -Wno-conversion
                -Wno-double-promotion
                -Wno-exit-time-destructors
                -Wno-extra-semi
                -Wno-float-conversion
                -Wno-gnu-anonymous-struct
                -Wno-gnu-zero-variadic-macro-arguments
                -Wno-missing-prototypes
                -Wno-nested-anon-types
                -Wno-padded
                -Wno-return-std-move-in-c++11
                -Wno-shorten-64-to-32
                -Wno-sign-conversion
                -Wno-unknown-warning-option
                -Wno-unused-command-line-argument
                -Wno-weak-vtables
                -Wno-covered-switch-default
                -Wno-unsafe-buffer-usage
                -Wno-unused-lambda-capture
                -Wno-nvcc-compat
            )
        else()
            # The loop variable is quoted so that if() compares the literal
            # language name instead of dereferencing a variable that happens
            # to be called "CXX".
            if(CMAKE_${COMPILER}_COMPILER_ID MATCHES "GNU" AND "${COMPILER}" STREQUAL "CXX")
                # Only g++ 6.1 or newer receives -Wno-ignored-attributes.
                # Spelled as NOT ... VERSION_LESS because CMake 3.5.2 has no
                # VERSION_GREATER_EQUAL operator.
                if(NOT CMAKE_CXX_COMPILER_VERSION VERSION_LESS "6.1")
                    list(APPEND CMAKE_COMPILER_WARNINGS
                        -Wno-ignored-attributes
                    )
                endif()
            endif()

            # Applied for every non-Clang compiler.
            list(APPEND CMAKE_COMPILER_WARNINGS
                -Wno-missing-field-initializers
                -Wno-deprecated-declarations
            )
        endif()

        # NOTE(review): add_definitions() is documented as intended for
        # preprocessor definitions; add_compile_options() is the usual command
        # for warning flags. Kept unchanged here because switching may alter
        # where the flags land on the command line -- confirm before changing.
        add_definitions(${CMAKE_COMPILER_WARNINGS})
    endforeach()
endif()
|