Clear the CUDA cache after computing embeddings
This commit is contained in:
parent
8eebc192e0
commit
3a38099749
@@ -2,6 +2,7 @@ from fastapi import FastAPI
|
||||
from fastapi import HTTPException
|
||||
import uvicorn
|
||||
from pydantic import BaseModel
|
||||
import torch
|
||||
|
||||
from models.embedder_gemma import TextEmbedderGemma
|
||||
from models.embedder_gemma_train import TextEmbedderGemmaTrain
|
||||
@@ -52,4 +53,6 @@ def embed_gemma(request: EmbedRequest):
|
||||
else:
|
||||
raise HTTPException(status_code=400, detail="Invalid model")
|
||||
|
||||
torch.cuda.empty_cache()
|
||||
|
||||
return {"data": [{"embedding": emb.tolist()} for emb in embeddings]}
|
||||
Loading…
x
Reference in New Issue
Block a user