mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-02-07 23:10:10 +00:00
Change default FA offset to ln(2) (#1235)
* Change default FA offset to ln(2)
* Also here
This commit is contained in:
@@ -4536,7 +4536,7 @@ struct cuda_params {
|
||||
int fusion = GGML_CUDA_FUSION;
|
||||
int offload_batch_size = GGML_CUDA_MIN_BATCH_OFFLOAD;
|
||||
int mmq_id_thresh = 32;
|
||||
- float fa_offset = 0;
|
||||
+ float fa_offset = 0.6931f;
|
||||
#ifdef USE_CUDA_GRAPH
|
||||
bool use_cuda_graph = true;
|
||||
#else
|
||||
|
||||
@@ -853,7 +853,7 @@ struct ggml_backend_cuda_context {
|
||||
int fusion = GGML_CUDA_FUSION;
|
||||
int offload_batch_size = GGML_CUDA_MIN_BATCH_OFFLOAD;
|
||||
int mmq_id_thresh = 32;
|
||||
- float fa_offset = 0.0f;
|
||||
+ float fa_offset = 0.6931f; // ln(2)
|
||||
#ifdef USE_CUDA_GRAPH
|
||||
bool use_cuda_graph = true;
|
||||
|
||||
|
||||
Reference in New Issue
Block a user