Change default FA offset to ln(2) (#1235)

* Change default FA offset to ln(2)

* Also here
This commit is contained in:
Kawrakow
2026-02-05 13:42:53 +02:00
committed by GitHub
parent 9c1c74acda
commit a7befb3bed
2 changed files with 2 additions and 2 deletions

View File

@@ -4536,7 +4536,7 @@ struct cuda_params {
int fusion = GGML_CUDA_FUSION;
int offload_batch_size = GGML_CUDA_MIN_BATCH_OFFLOAD;
int mmq_id_thresh = 32;
- float fa_offset = 0;
+ float fa_offset = 0.6931f;
#ifdef USE_CUDA_GRAPH
bool use_cuda_graph = true;
#else

View File

@@ -853,7 +853,7 @@ struct ggml_backend_cuda_context {
int fusion = GGML_CUDA_FUSION;
int offload_batch_size = GGML_CUDA_MIN_BATCH_OFFLOAD;
int mmq_id_thresh = 32;
- float fa_offset = 0.0f;
+ float fa_offset = 0.6931f; // ln(2)
#ifdef USE_CUDA_GRAPH
bool use_cuda_graph = true;