Merge branch 'neo'

Cohee
2023-09-03 16:45:43 +03:00
2 changed files with 7 additions and 25 deletions

modules/classify/classify_module.py

@@ -3,26 +3,23 @@ Classify module for SillyTavern Extras
Authors:
- Tony Ribeiro (https://github.com/Tony-sama)
- Cohee (https://github.com/Cohee1207)
Provides classification features for text
References:
- https://huggingface.co/tasks/text-classification
"""
-import torch
from transformers import pipeline
DEBUG_PREFIX = "<Classify module>"
# Models init
-cuda_device = "cuda:0"# if not args.cuda_device else args.cuda_device
-device_string = cuda_device if torch.cuda.is_available() else 'cpu'
-device = torch.device(device_string)
-torch_dtype = torch.float32 if device_string != cuda_device else torch.float16
text_emotion_pipe = None
-def init_text_emotion_classifier(model_name: str) -> None:
+def init_text_emotion_classifier(model_name: str, device: str, torch_dtype: str) -> None:
    global text_emotion_pipe
    print(DEBUG_PREFIX,"Initializing text classification pipeline with model",model_name)
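With this hunk, the initializer receives device and torch_dtype from the caller instead of probing CUDA at import time. A minimal sketch of what the refactored body plausibly looks like (the pipeline kwargs are inferred from the call deleted from server.py further down, not shown in this hunk):

    def init_text_emotion_classifier(model_name: str, device: str, torch_dtype: str) -> None:
        global text_emotion_pipe
        print(DEBUG_PREFIX, "Initializing text classification pipeline with model", model_name)
        text_emotion_pipe = pipeline(
            "text-classification",
            model=model_name,
            top_k=None,               # score every label instead of only the best one
            device=device,            # e.g. "cuda:0" or "cpu", chosen by the caller
            torch_dtype=torch_dtype,  # float16 on GPU, float32 on CPU
        )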
@@ -41,4 +38,4 @@ def classify_text_emotion(text: str) -> list:
        truncation=True,
        max_length=text_emotion_pipe.model.config.max_position_embeddings,
    )[0]
-    return sorted(output, key=lambda x: x["score"], reverse=True)
\ No newline at end of file
+    return sorted(output, key=lambda x: x["score"], reverse=True)
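Because the pipeline is created with top_k=None, classify_text_emotion returns a score for every label, sorted so the dominant emotion comes first. A hedged usage sketch (the exact label set depends on whichever classification model is configured):

    scores = classify_text_emotion("I can't believe we actually won!")
    # e.g. [{"label": "joy", "score": 0.97}, {"label": "surprise", "score": 0.02}, ...]
    top_emotion = scores[0]["label"]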

server.py

@@ -327,19 +327,9 @@ if max_content_length is not None:
print("Setting MAX_CONTENT_LENGTH to",max_content_length,"Mb")
app.config["MAX_CONTENT_LENGTH"] = int(max_content_length) * 1024 * 1024
+# TODO: Keij, unify main classify and module one
if "classify" in modules:
print("Initializing a sentiment classification pipeline...")
classification_pipe = pipeline(
"text-classification",
model=classification_model,
top_k=None,
device=device,
torch_dtype=torch_dtype,
)
import modules.classify.classify_module as classify_module
classify_module.init_text_emotion_classifier(classification_model)
classify_module.init_text_emotion_classifier(classification_model, device, torch_dtype)
if "vosk-stt" in modules:
print("Initializing Vosk speech-recognition (from ST request file)")
@@ -407,7 +397,7 @@ if "coqui-tts" in modules:
mode = "GPU" if args.coqui_gpu else "CPU"
print("Initializing Coqui TTS client in " + mode + " mode")
import modules.text_to_speech.coqui.coqui_module as coqui_module
if mode == "GPU":
coqui_module.gpu_mode = True
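The coqui block relies on a module-level flag rather than a parameter: server.py flips coqui_module.gpu_mode before any model loads. A hedged sketch of the consuming side (coqui_module internals are assumed, not shown in this diff; load_tts is an illustrative name):

    from TTS.api import TTS  # Coqui TTS client

    gpu_mode = False  # overwritten by server.py when args.coqui_gpu is set

    def load_tts(model_name: str) -> TTS:
        # Consult the flag at load time, after server.py has had a chance to set it.
        return TTS(model_name).to("cuda" if gpu_mode else "cpu")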
@@ -448,12 +438,7 @@ def require_module(name):
# AI stuff
def classify_text(text: str) -> list:
-    output = classification_pipe(
-        text,
-        truncation=True,
-        max_length=classification_pipe.model.config.max_position_embeddings,
-    )[0]
-    return sorted(output, key=lambda x: x["score"], reverse=True)
+    return classify_module.classify_text_emotion(text)
def caption_image(raw_image: Image, max_new_tokens: int = 20) -> str:
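With this last hunk, classify_text is a thin wrapper over the module, so existing callers such as the HTTP route stay untouched. A hedged sketch of how a Flask route might use it (the route path and payload shape are assumptions, not shown in this diff):

    @app.route("/api/classify", methods=["POST"])
    def api_classify():
        data = request.get_json()
        classification = classify_text(data["text"])  # sorted list of {label, score}
        return jsonify({"classification": classification})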