mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-04-28 10:11:39 +00:00
Embeddings: Switch to Infinity
Infinity-emb is an async batching engine for embeddings. This is preferable to sentence-transformers since it handles scalable use cases without the need for external thread intervention. Signed-off-by: kingbri <bdashore3@proton.me>
This commit is contained in:
@@ -135,6 +135,6 @@ async def chat_completion_request(
|
||||
dependencies=[Depends(check_api_key), Depends(check_model_container)],
|
||||
)
|
||||
async def handle_embeddings(data: EmbeddingsRequest) -> EmbeddingsResponse:
|
||||
response = await embeddings(data.input, data.encoding_format, data.model)
|
||||
response = await embeddings(data)
|
||||
|
||||
return response
|
||||
|
||||
Reference in New Issue
Block a user