Zen4 Flash Attention: WIP bf16

This commit is contained in:
Iwan Kawrakow
2024-09-04 13:09:24 +03:00
parent f17d0d72f5
commit 8218e77dec
3 changed files with 385 additions and 1 deletions

View File

@@ -2221,6 +2221,9 @@ static ggml_type kv_cache_type_from_str(const std::string & s) {
if (s == "f16") {
return GGML_TYPE_F16;
}
if (s == "bf16") {
return GGML_TYPE_BF16;
}
if (s == "q8_0") {
return GGML_TYPE_Q8_0;
}