mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-04-22 15:28:56 +00:00
Model: Add tensor_parallel_backend option
This allows users to choose either nccl or native depending on the GPU setup. NCCL is only available with Linux-built wheels. Signed-off-by: kingbri <8082010+kingbri1@users.noreply.github.com>
This commit is contained in:
@@ -87,6 +87,12 @@ model:
|
||||
# This ignores the gpu_split_auto value.
|
||||
tensor_parallel: false
|
||||
|
||||
# Sets the backend type for tensor parallelism (default: native).
|
||||
# Options: native, nccl
|
||||
# Native is recommended for PCIe GPUs.
|
||||
# NCCL is recommended for NVLink.
|
||||
tensor_parallel_backend: native
|
||||
|
||||
# Automatically allocate resources to GPUs (default: True).
|
||||
# Not parsed for single GPU users.
|
||||
gpu_split_auto: true
|
||||
|
||||
Reference in New Issue
Block a user