B FastembedServer: Switch to OpenAI api, support changing models
This commit is contained in:
parent
72ec261a69
commit
b9af017a4c
1 changed files with 7 additions and 5 deletions
|
@ -2,18 +2,20 @@ from fastembed import TextEmbedding
|
|||
from fastapi import FastAPI
|
||||
from pydantic import BaseModel
|
||||
|
||||
model = TextEmbedding("snowflake/snowflake-arctic-embed-xs")
|
||||
models = {}
|
||||
|
||||
app = FastAPI()
|
||||
|
||||
class EmbeddingRequest(BaseModel):
|
||||
model: str
|
||||
prompt: str
|
||||
input: str
|
||||
|
||||
@app.post("/api/embeddings")
|
||||
@app.post("/v1/embeddings")
|
||||
def embeddings(request: EmbeddingRequest):
|
||||
embeddings = next(model.embed(request.prompt)).tolist()
|
||||
return {"embedding": embeddings}
|
||||
model = models.get(request.model) or TextEmbedding(request.model)
|
||||
models[request.model] = model
|
||||
embeddings = next(model.embed(request.input)).tolist()
|
||||
return {"data": [{"embedding": embeddings}]}
|
||||
|
||||
if __name__ == "__main__":
|
||||
import uvicorn
|
||||
|
|
Loading…
Reference in a new issue