Embeddings: Add model management

Embedding models are managed on a separate backend, but are run in parallel with the model itself. Therefore, manage this in a separate container with separate routes. Signed-off-by: kingbri <bdashore3@proton.me>
2026-03-14 15:57:27 +00:00 · 2024-07-30 15:19:27 -04:00
parent f13d0fb8b3
commit bfa011e0ce
6 changed files with 135 additions and 19 deletions
--- a/main.py
+++ b/main.py
@@ -90,14 +90,17 @@ async def entrypoint_async():
    # If an initial embedding model name is specified, create a separate container
    # and load the model
    embedding_config = config.embeddings_config()
-    embedding_model_name = embedding_config.get("embeddings_model_name")
+    embedding_model_name = embedding_config.get("embedding_model_name")
    if embedding_model_name:
        embedding_model_path = pathlib.Path(
-            unwrap(embedding_config.get("embeddings_model_dir"), "models")
+            unwrap(embedding_config.get("embedding_model_dir"), "models")
        )
        embedding_model_path = embedding_model_path / embedding_model_name

-        await model.load_embeddings_model(embedding_model_path, **embedding_config)
+        try:
+            await model.load_embedding_model(embedding_model_path, **embedding_config)
+        except ImportError as ex:
+            logger.error(ex.msg)

    await start_api(host, port)