Make /v1/embeddings functional, add request/response types

This commit is contained in:
oobabooga 2023-11-10 07:34:27 -08:00
parent 7ed2143cd6
commit c5be3f7acb
6 changed files with 40 additions and 26 deletions

View file

@@ -154,6 +154,19 @@ class LoadModelRequest(BaseModel):
settings: dict | None = None
# Request body for the embeddings endpoint.
class EmbeddingsRequest(BaseModel):
    # Text to embed: either one string or a list of strings.
    input: str | List[str]

    # Optional and defaults to None; per its own description the value is
    # not used to pick a model.
    model: str | None = Field(
        default=None,
        description=(
            "Unused parameter. To change the model, set the "
            "OPENEDAI_EMBEDDING_MODEL and OPENEDAI_EMBEDDING_DEVICE "
            "environment variables before starting the server."
        ),
    )

    # Requested output encoding; defaults to "float".
    encoding_format: str = Field(
        default="float",
        description="Can be float or base64.",
    )

    # Optional and defaults to None; documented as unused.
    user: str | None = Field(
        default=None,
        description="Unused parameter.",
    )
# Shape of an embedding entry: an index, the vector, and an object tag.
# NOTE(review): EmbeddingsRequest.encoding_format documents a "base64"
# option, while `embedding` below is typed as a list of floats -- confirm
# how base64 output is meant to relate to this model.
class EmbeddingsResponse(BaseModel):
    # Integer index of this entry (required).
    index: int

    # The embedding values as a list of floats (required).
    embedding: List[float]

    # Type tag for the entry; defaults to "embedding".
    object: str = "embedding"
def to_json(obj):
    """Return the instance attributes of ``obj`` as a JSON string.

    The object's ``__dict__`` is passed to ``json.dumps`` with a
    four-space indent, so every attribute value must itself be
    JSON-serializable.
    """
    attributes = obj.__dict__
    return json.dumps(attributes, indent=4)