mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-03-14 15:57:27 +00:00
Merge pull request #254 from lucyknada/main
add draft_gpu_split option for spec decoding
This commit is contained in:
@@ -351,6 +351,13 @@ class DraftModelConfig(BaseConfigModel):
|
||||
f"Possible values: {str(CACHE_SIZES)[15:-1]}."
|
||||
),
|
||||
)
|
||||
# VRAM budget (in GB) to split between GPUs for the draft model used in
# speculative decoding. The annotation is List[float], so fractional amounts
# are accepted; the description therefore does not call it an "integer" array.
# An empty list (the default) means the draft model is autosplit.
draft_gpu_split: List[float] = Field(
    default_factory=list,
    description=(
        "An array of GBs of VRAM to split between GPUs (default: []).\n"
        "If this isn't filled in, the draft model is autosplit."
    ),
)
|
||||
|
||||
|
||||
class LoraInstanceModel(BaseConfigModel):
|
||||
|
||||
Reference in New Issue
Block a user