From cfe137b308ee2d63af6f61879d4833cb92116a56 Mon Sep 17 00:00:00 2001 From: turboderp <11859846+turboderp@users.noreply.github.com> Date: Fri, 24 Apr 2026 02:55:00 +0200 Subject: [PATCH] GatedDeltaNet: Fix rewind logic --- exllamav3/modules/gated_delta_net.py | 1 + 1 file changed, 1 insertion(+) diff --git a/exllamav3/modules/gated_delta_net.py b/exllamav3/modules/gated_delta_net.py index 18d60e4..4551210 100644 --- a/exllamav3/modules/gated_delta_net.py +++ b/exllamav3/modules/gated_delta_net.py @@ -285,6 +285,7 @@ class GDN_RecurrentState(CacheableState): self.last_recurrent_state[0].copy_(self.history[0, -count]) cdim = self.last_conv_state.shape[-1] self.last_conv_state[0].copy_(self.conv_history[0, :, -count - cdim : -count]) + self.position -= count class GatedDeltaNet(Module):