diff --git a/OAI/types/completions.py b/OAI/types/completion.py similarity index 97% rename from OAI/types/completions.py rename to OAI/types/completion.py index ffe84c7..813877c 100644 --- a/OAI/types/completions.py +++ b/OAI/types/completion.py @@ -35,10 +35,10 @@ class CompletionRequest(BaseModel): max_tokens: Optional[int] = 150 # Not supported sampling params - presence_penalty: Optional[int] = 0 + presence_penalty: Optional[float] = 0.0 # Aliased to repetition_penalty - frequency_penalty: int = 0 + frequency_penalty: Optional[float] = 0.0 # Sampling params token_healing: Optional[bool] = False diff --git a/OAI/utils.py b/OAI/utils.py index c889605..f6f70a0 100644 --- a/OAI/utils.py +++ b/OAI/utils.py @@ -1,5 +1,5 @@ import pathlib -from OAI.types.completions import CompletionResponse, CompletionRespChoice +from OAI.types.completion import CompletionResponse, CompletionRespChoice from OAI.types.common import UsageStats from OAI.types.model import ModelList, ModelCard from typing import Optional diff --git a/main.py b/main.py index 607922a..73bf0de 100644 --- a/main.py +++ b/main.py @@ -6,7 +6,7 @@ from fastapi import FastAPI, Request, HTTPException, Depends from model import ModelContainer from progress.bar import IncrementalBar from sse_starlette import EventSourceResponse -from OAI.types.completions import CompletionRequest +from OAI.types.completion import CompletionRequest from OAI.types.model import ModelCard, ModelLoadRequest, ModelLoadResponse from OAI.types.token import TokenEncodeRequest, TokenEncodeResponse, TokenDecodeRequest, TokenDecodeResponse from OAI.utils import create_completion_response, get_model_list