mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-03-14 15:57:27 +00:00
Model: Fix no flash attention
The flash attention option was being read from the config under the wrong key ("no_flash_attn" instead of "no_flash_attention"). Signed-off-by: kingbri <bdashore3@proton.me>
This commit is contained in:
2
model.py
2
model.py
@@ -94,7 +94,7 @@ class ModelContainer:
|
||||
)
|
||||
|
||||
# Turn off flash attention?
|
||||
- self.config.no_flash_attn = unwrap(kwargs.get("no_flash_attn"), False)
|
||||
+ self.config.no_flash_attn = unwrap(kwargs.get("no_flash_attention"), False)
|
||||
|
||||
# low_mem is currently broken in exllamav2. Don't use it until it's fixed.
|
||||
"""
|
||||
|
||||
Reference in New Issue
Block a user