Add coqui model preload

This commit is contained in:
SillyLossy
2023-07-26 22:49:44 +03:00
parent 30a2424e8f
commit 9b1e3d1250
2 changed files with 4 additions and 0 deletions

View File

@@ -153,6 +153,7 @@ cd SillyTavern-extras
| `--cuda` | Uses CUDA (GPU+VRAM) to run modules if it is available. Otherwise, falls back to using CPU. |
| `--cuda-device` | Specifies a CUDA device to use. Defaults to `cuda:0` (first available GPU). |
| `--coqui-gpu` | Uses GPU for coqui TTS (if available). |
| `--coqui-model` | If provided, downloads and preloads a coqui TTS model. Default: none.<br>Example: `tts_models/multilingual/multi-dataset/bark` |
| `--summarization-model` | Load a custom summarization model.<br>Expects a HuggingFace model ID.<br>Default: [Qiliang/bart-large-cnn-samsum-ChatGPT_v3](https://huggingface.co/Qiliang/bart-large-cnn-samsum-ChatGPT_v3) |
| `--classification-model` | Load a custom sentiment classification model.<br>Expects a HuggingFace model ID.<br>Default (6 emotions): [nateraw/bert-base-uncased-emotion](https://huggingface.co/nateraw/bert-base-uncased-emotion)<br>Another solid option (28 emotions): [joeddav/distilbert-base-uncased-go-emotions-student](https://huggingface.co/joeddav/distilbert-base-uncased-go-emotions-student)<br>For Chinese language: [touch20032003/xuyuan-trial-sentiment-bert-chinese](https://huggingface.co/touch20032003/xuyuan-trial-sentiment-bert-chinese) |
| `--captioning-model` | Load a custom captioning model.<br>Expects a HuggingFace model ID.<br>Default: [Salesforce/blip-image-captioning-large](https://huggingface.co/Salesforce/blip-image-captioning-large) |

View File

@@ -83,6 +83,7 @@ parser.add_argument(
"--secure", action="store_true", help="Enforces the use of an API key"
)
# --coqui-gpu is an opt-in switch: absent -> False (CPU), present -> True (GPU).
# It previously used action="store_false", which made the value default to True
# and flipped it to False when the flag was passed -- the opposite of what the
# help text promises.
parser.add_argument("--coqui-gpu", action="store_true", help="Run the voice models on the GPU (CPU is default)")
# Optional Coqui TTS model identifier; argparse leaves it as None when the
# option is not given.
parser.add_argument("--coqui-model", help="Load a custom Coqui TTS model")
# Create a mutually exclusive option group on the parser, then an "sd-local"
# argument group underneath it.
# NOTE(review): "sd" presumably stands for Stable Diffusion -- confirm against
# the options registered on these groups further down the file.
sd_group = parser.add_mutually_exclusive_group()
local_sd = sd_group.add_argument_group("sd-local")
@@ -253,6 +254,8 @@ if "coqui-tts" in modules:
print("Initializing Coqui TTS client in " + mode + " mode")
import tts_coqui as coqui
from tts_coqui import *
if args.coqui_model is not None:
coqui.coqui_modeldownload(args.coqui_model)
if "edge-tts" in modules:
print("Initializing Edge TTS client")