mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2026-03-14 18:37:23 +00:00
* [feat]: init amd adaption * [feat]: add blis support * [fix]: fix setup and moe kernel wrapper * [fix](setup.py): support rebuild with cache and import kt_kernel works fine * [feat]: add moe_kernel converter for amd and implement the load method (haven't tested yet) * [feat](moe_kernel/moe.hpp): delete unused memory when using save * [fix](moe_kernel): update PLAIN for pack * [fix](moe_kernel): rm printf debug * [fix](moe_kernel): skip gpu experts * [fix](moe_kernel/moe.hpp): update include memory path * [feat](moe_kernel/moe.hpp): support expert deferral * [feat]: finish amd --------- Co-authored-by: mrhaoxx <mr.haoxx@gmail.com>
62 lines
1.5 KiB
JSON
62 lines
1.5 KiB
JSON
{
  "version": 3,
  "cmakeMinimumRequired": {
    "major": 3,
    "minor": 19,
    "patch": 0
  },
  "configurePresets": [
    {
      "name": "avx512",
      "displayName": "avx512_platform",
      "description": "for avx512 platform",
      "cacheVariables": {
        "KTRANSFORMERS_CPU_USE_AMX": "OFF",
        "LLAMA_AVX512": "OFF",
        "LLAMA_AVX2": "OFF",
        "KTRANSFORMERS_CPU_USE_AMX_AVX512": "ON",
        "KTRANSFORMERS_USE_CUDA": "ON"
      }
    },
    {
      "name": "avx",
      "displayName": "avx_platform",
      "description": "for avx platform",
      "cacheVariables": {
        "KTRANSFORMERS_CPU_USE_AMX": "OFF",
        "LLAMA_AVX2": "ON",
        "KTRANSFORMERS_USE_CUDA": "ON"
      }
    },
    {
      "name": "amx",
      "displayName": "amx_platform",
      "description": "for amx platform",
      "cacheVariables": {
        "KTRANSFORMERS_CPU_USE_AMX": "ON",
        "LLAMA_AVX512": "OFF",
        "LLAMA_AVX2": "OFF",
        "KTRANSFORMERS_CPU_USE_AMX_AVX512": "ON",
        "KTRANSFORMERS_USE_CUDA": "ON"
      }
    },
    {
      "name": "amd",
      "displayName": "amd_platform",
      "description": "for amd platform",
      "cacheVariables": {
        "KTRANSFORMERS_CPU_USE_AMX": "OFF",
        "LLAMA_AVX512": "OFF",
        "LLAMA_AVX2": "ON",
        "KTRANSFORMERS_CPU_USE_AMX_AVX512": "OFF",
        "KTRANSFORMERS_USE_CUDA": "ON",
        "KTRANSFORMERS_CPU_MOE_AMD": "ON",
        "KTRANSFORMERS_CPU_MOE_KERNEL": "ON"
      }
    }
  ]
}