Mirror of https://github.com/ikawrakow/ik_llama.cpp.git
Is this better for multi-GPU and split mode "graph"?
@@ -688,12 +688,6 @@ ggml_tensor * llm_build_context::llm_build_ffn(
        cur = ggml_add(ctx, cur, ffn[id]);
        cb(cur, "combine_ffn", il);
    }
    if (ffn.size() > 2) {
        cur->op_params[0] = 0xff;
    }
    //if (cur->type != GGML_TYPE_F32) {
    //    cur = ggml_cast(ctx, cur, GGML_TYPE_F32);
    //}

    return cur;
}
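
For context, here is a minimal standalone sketch of the accumulation pattern this hunk touches: per-expert FFN outputs summed into a single tensor with ggml_add. This is an illustration written against the public ggml C API (ggml_init, ggml_new_tensor_1d, ggml_add, ggml_new_graph, ggml_graph_compute_with_ctx), not code from this repository; the expert count, tensor sizes, and values are made up, and the meaning of cur->op_params[0] = 0xff is left out.

// Sketch only: sums n_expert per-expert outputs into one tensor, mirroring the
// cur = ggml_add(ctx, cur, ffn[id]) loop in the hunk above.
#include "ggml.h"

#include <cstdio>
#include <vector>

int main() {
    struct ggml_init_params params = {
        /*.mem_size   =*/ 16*1024*1024,
        /*.mem_buffer =*/ NULL,
        /*.no_alloc   =*/ false,
    };
    struct ggml_context * ctx = ggml_init(params);

    const int n_embd   = 8;   // hypothetical embedding size
    const int n_expert = 4;   // hypothetical number of active experts

    // stand-ins for the per-expert FFN outputs
    std::vector<ggml_tensor *> ffn(n_expert);
    for (int id = 0; id < n_expert; ++id) {
        ffn[id] = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embd);
        ggml_set_f32(ffn[id], 1.0f);
    }

    // accumulate expert outputs into a single result tensor
    ggml_tensor * cur = ffn[0];
    for (int id = 1; id < n_expert; ++id) {
        cur = ggml_add(ctx, cur, ffn[id]);
    }

    // build and run the graph on CPU
    struct ggml_cgraph * gf = ggml_new_graph(ctx);
    ggml_build_forward_expand(gf, cur);
    ggml_graph_compute_with_ctx(ctx, gf, /*n_threads =*/ 1);

    printf("cur[0] = %.1f\n", ggml_get_f32_1d(cur, 0)); // expect 4.0

    ggml_free(ctx);
    return 0;
}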