From 5cb91c5505370e55bc20f3e90f519e7786cd508f Mon Sep 17 00:00:00 2001 From: turboderp <11859846+turboderp@users.noreply.github.com> Date: Mon, 2 Mar 2026 16:35:26 +0100 Subject: [PATCH] GatedDeltaNet: Fix output projection no. input features --- exllamav3/modules/gated_delta_net.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/exllamav3/modules/gated_delta_net.py b/exllamav3/modules/gated_delta_net.py index 5913fb8..29c325c 100644 --- a/exllamav3/modules/gated_delta_net.py +++ b/exllamav3/modules/gated_delta_net.py @@ -352,7 +352,14 @@ class GatedDeltaNet(Module): self.b_proj = None self.a_proj = None - self.o_proj = Linear(config, f"{key}.{key_o}", 2 * hidden_size, hidden_size, qmap = qmap + ".output", out_dtype = self.out_dtype) + self.o_proj = Linear( + config, + f"{key}.{key_o}", + self.v_head_dim * self.num_v_heads, + hidden_size, + qmap = qmap + ".output", + out_dtype = self.out_dtype + ) self.register_submodule(self.o_proj) self.norm = GatedRMSNorm(config, f"{key}.{key_norm}", self.rms_norm_eps, out_dtype = torch.half)