mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-04-29 10:42:03 +00:00
Config: Remove developer arg cuda_malloc_backend
* cudaMallocAsync is now enabled by default on supported configurations
This commit is contained in:
@@ -419,9 +419,6 @@ class DeveloperConfig(BaseConfigModel):
|
|||||||
disable_request_streaming: Optional[bool] = Field(
|
disable_request_streaming: Optional[bool] = Field(
|
||||||
False, description=("Disable API request streaming (default: False).")
|
False, description=("Disable API request streaming (default: False).")
|
||||||
)
|
)
|
||||||
cuda_malloc_backend: Optional[bool] = Field(
|
|
||||||
False, description=("Enable the torch CUDA malloc backend (default: False).")
|
|
||||||
)
|
|
||||||
realtime_process_priority: Optional[bool] = Field(
|
realtime_process_priority: Optional[bool] = Field(
|
||||||
False,
|
False,
|
||||||
description=(
|
description=(
|
||||||
|
|||||||
@@ -216,9 +216,6 @@ developer:
|
|||||||
# Disable API request streaming (default: False).
|
# Disable API request streaming (default: False).
|
||||||
disable_request_streaming: false
|
disable_request_streaming: false
|
||||||
|
|
||||||
# Enable the torch CUDA malloc backend (default: False).
|
|
||||||
cuda_malloc_backend: false
|
|
||||||
|
|
||||||
# Set process to use a higher priority.
|
# Set process to use a higher priority.
|
||||||
# For realtime process priority, run as administrator or sudo.
|
# For realtime process priority, run as administrator or sudo.
|
||||||
# Otherwise, the priority will be set to high.
|
# Otherwise, the priority will be set to high.
|
||||||
|
|||||||
Reference in New Issue
Block a user