moraxgiga's picture
Update TextGen/router.py
36899d6 verified
raw
history blame contribute delete
No virus
983 Bytes
from pydantic import BaseModel
from fastapi.middleware.cors import CORSMiddleware
from transformers import AutoModel
from typing import List
import os, platform, time
# Load the embedding model once, at import time; the request handler below
# reuses this single module-level instance for every call.
# NOTE(review): trust_remote_code=True lets transformers execute custom Python
# code shipped in the model repository — confirm the repository is trusted
# (and consider pinning a revision).
model = AutoModel.from_pretrained('jinaai/jina-embeddings-v2-base-en', trust_remote_code=True)
class Validation(BaseModel):
    """Request body accepted by the embedding endpoint."""

    # Sentences to embed; the handler passes the whole list to the model
    # in a single encode call.
    prompt: List[str]
from TextGen import app
# Register CORS handling on the app imported from TextGen: every origin,
# HTTP method and request header is accepted, and credentials are enabled.
# NOTE(review): the FastAPI CORS documentation states that wildcard ("*")
# values must not be combined with allow_credentials=True — confirm whether
# credentialed cross-origin requests are really needed, or list the allowed
# origins explicitly.
app.add_middleware(
CORSMiddleware,
allow_origins=["*"],
allow_credentials=True,
allow_methods=["*"],
allow_headers=["*"],
)
@app.post("/api/generate", summary="Generate embeddings", tags=["Generate"])
def inference(item: Validation):
    """Embed the sentences in the request and report how long encoding took.

    Args:
        item: Validated request body; ``item.prompt`` holds the list of
            sentences to embed.

    Returns:
        A dict with three keys:

        * ``"embeddings"`` -- ``model.encode(item.prompt).tolist()``
          (presumably one vector per input sentence; confirm against the
          model's ``encode`` implementation).
        * ``"time_taken"`` -- elapsed time of the encode + ``tolist`` step,
          formatted as ``"<seconds with two decimals> seconds"``.
        * ``"Number_of_sentence_processed"`` -- ``len(item.prompt)``.
    """
    sentences = item.prompt

    # perf_counter() is a monotonic, high-resolution clock, so the measured
    # interval cannot be distorted (or go negative) if the system wall clock
    # is adjusted while the model is running, unlike time.time().
    started = time.perf_counter()
    embeddings = model.encode(sentences).tolist()
    time_taken = time.perf_counter() - started

    return {
        "embeddings": embeddings,
        "time_taken": f"{time_taken:.2f} seconds",
        "Number_of_sentence_processed": len(sentences),
    }