mirror of
https://github.com/turboderp-org/exllamav2.git
synced 2026-04-20 14:29:28 +00:00
Kernel optimizations WIP
This commit is contained in:
@@ -52,7 +52,7 @@ if args.prompt:
|
||||
|
||||
print(f" -- Warmup...")
|
||||
|
||||
model.forward(ids[:, :])
|
||||
model.forward(ids[:, -1:])
|
||||
|
||||
print(f" -- Generating (greedy sampling)...")
|
||||
print()
|
||||
|
||||
Reference in New Issue
Block a user