GatedDeltaNet: Fix rewind logic

This commit is contained in:
turboderp
2026-04-24 02:55:00 +02:00
parent 14a2cbff1d
commit cfe137b308

View File

@@ -285,6 +285,7 @@ class GDN_RecurrentState(CacheableState):
self.last_recurrent_state[0].copy_(self.history[0, -count])
cdim = self.last_conv_state.shape[-1]
self.last_conv_state[0].copy_(self.conv_history[0, :, -count - cdim : -count])
self.position -= count
class GatedDeltaNet(Module):