Clear CUDA cache before returning embeddings (add torch.cuda.empty_cache() call)
This commit is contained in:
parent
8eebc192e0
commit
3a38099749
@ -2,6 +2,7 @@ from fastapi import FastAPI
|
|||||||
from fastapi import HTTPException
|
from fastapi import HTTPException
|
||||||
import uvicorn
|
import uvicorn
|
||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
|
import torch
|
||||||
|
|
||||||
from models.embedder_gemma import TextEmbedderGemma
|
from models.embedder_gemma import TextEmbedderGemma
|
||||||
from models.embedder_gemma_train import TextEmbedderGemmaTrain
|
from models.embedder_gemma_train import TextEmbedderGemmaTrain
|
||||||
@ -52,4 +53,6 @@ def embed_gemma(request: EmbedRequest):
|
|||||||
else:
|
else:
|
||||||
raise HTTPException(status_code=400, detail="Invalid model")
|
raise HTTPException(status_code=400, detail="Invalid model")
|
||||||
|
|
||||||
|
torch.cuda.empty_cache()
|
||||||
|
|
||||||
return {"data": [{"embedding": emb.tolist()} for emb in embeddings]}
|
return {"data": [{"embedding": emb.tolist()} for emb in embeddings]}
|
||||||
Loading…
x
Reference in New Issue
Block a user