Remove autoregressive and chunking

2026-03-09 13:30:17 +00:00 · 2026-02-28 13:21:19 +00:00
parent de88fa04b7
commit b845b0612c
7 changed files with 6 additions and 353 deletions
--- a/include/llama.h
+++ b/include/llama.h
@@ -456,7 +456,6 @@ extern "C" {
        bool split_mode_graph_scheduling; // if true, force split mode graph scheduling
        //bool split_mode_f16;    // if true, cast intermediate results to f16 before copying to other GPUs
        bool scheduler_async;   // if true, with split mode "graph" graph evaluation will be done using multiple threads
-        int  fused_delta_net;
        bool mtp;   // Activate MTP if supported
        enum llama_mtp_op_type mtp_op_type;