Fix flash attention long argument for mainline compatibility

This commit is contained in:
Kawrakow
2025-11-13 19:22:16 +02:00
parent ce3ce97a29
commit 22c20fcd6d

View File

@@ -1135,7 +1135,7 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa
params.flash_attn = false;
return true;
}
if (arg == "-fa" || arg == "--flash-attention") {
if (arg == "-fa" || arg == "--flash-attn") {
CHECK_ARG
std::string next_arg{argv[i]};
for (auto& c : next_arg) c = std::tolower(c);