itertools.pairwise substitute for Python<3.10

2026-04-20 14:29:28 +00:00 · 2024-06-24 02:29:15 +02:00
parent 1552b06a7a
commit 0697196357
2 changed files with 14 additions and 2 deletions
--- a/exllamav2/compat.py
+++ b/exllamav2/compat.py
@@ -1,5 +1,16 @@
 from __future__ import annotations
 import torch
+import itertools
+
+# Provide a fallback equivalent of itertools.pairwise for Python < 3.10, where it is not available
+
+try:
+    pairwise = itertools.pairwise  # use the stdlib implementation when itertools provides it
+except AttributeError:  # raised when itertools has no `pairwise` attribute
+    def pairwise(iterable):  # fallback: yields overlapping pairs (s0, s1), (s1, s2), ...
+        a, b = itertools.tee(iterable)  # two independent iterators over the same input
+        next(b, None)  # advance the second iterator by one; the None default avoids StopIteration on empty input
+        return zip(a, b)  # zip stops at the shorter iterator, so fewer than two items yields no pairs

 # On some setups Torch will attempt to use GPU peer-to-peer copies even when they are not supported. This is either
 # a driver issue, a bug in Torch, or both. Either way, the result is that .to() will create an empty tensor on the
--- a/exllamav2/generator/dynamic.py
+++ b/exllamav2/generator/dynamic.py
@@ -8,6 +8,7 @@ from exllamav2.attn import ExLlamaV2Attention, assert_paged_attn
 from exllamav2.ext import exllamav2_ext as ext_c, none_tensor
 from concurrent.futures import ThreadPoolExecutor

+from exllamav2.compat import pairwise
 import torch
 import random
 import numpy as np
@@ -1331,7 +1332,7 @@ class ExLlamaV2DynamicGenerator:
            rotation = [r * self.page_size for r in rotation]
            for cache, buffer in zip(cache_tensors, defrag_buffers):
                buffer[:, :, :, :].copy_(cache[:, rotation[0] : rotation[0] + self.page_size, :, :])
-                for a, b in itertools.pairwise(rotation):
+                for a, b in pairwise(rotation):
                    cache[:, a : a + self.page_size, :, :].copy_(cache[:, b : b + self.page_size, :, :])
                cache[:, rotation[-1] : rotation[-1] + self.page_size, :, :].copy_(buffer[:, :, :, :])

@@ -2392,7 +2393,7 @@ class ExLlamaV2DynamicJob:
            # Metrics

            self.total_pages += len(seq.allocated_pages)
-            for page_a, page_b in itertools.pairwise(seq.allocated_pages):
+            for page_a, page_b in pairwise(seq.allocated_pages):
                if page_b.page_index != page_a.page_index + 1:
                    self.non_sequential_pages += 1