# Author: robinroy03
# Commit e5e8307: Extended to 5 gunicorn workers, fixed embedding endpoint
from flask import Flask
from flask import request
from sentence_transformers import SentenceTransformer
import os
# Flask application object; the /embedding route below is registered on it.
app = Flask(__name__)
# Point the Hugging Face transformers cache at /.cache.
# NOTE(review): this assignment runs after `sentence_transformers` has already
# been imported above; if the library reads TRANSFORMERS_CACHE at import time
# the setting has no effect here -- confirm, and consider exporting the variable
# in the container/environment (or before the import) instead.
os.environ["TRANSFORMERS_CACHE"] = "/.cache"
# Load the embedding model once at module import so every request reuses it.
# trust_remote_code=True permits custom code shipped in the model repository to
# run during loading.
model = SentenceTransformer('Alibaba-NLP/gte-large-en-v1.5', trust_remote_code=True)
@app.route("/embedding", methods=['POST'])
def embedding():
    """Return the embedding of the text supplied in the JSON request body.

    Expected request body::

        {
            "text": <text>
        }

    Returns:
        ``{"output": <embedding>}`` where the embedding is the result of
        ``model.encode`` converted to plain Python lists so that Flask can
        serialise it as JSON. If the body is not a JSON object or has no
        ``"text"`` field, a ``{"error": ...}`` payload is returned with
        HTTP status 400.
    """
    message = request.get_json()

    # Reject malformed payloads explicitly instead of failing with a 500.
    if not isinstance(message, dict) or "text" not in message:
        return {"error": 'request body must be a JSON object with a "text" field'}, 400

    # Encode only the text field (not the whole payload), and call .tolist()
    # on the encoder's result -- the array, not the input string -- because
    # array objects are not JSON serialisable.
    vector = model.encode(message["text"])
    return {"output": vector.tolist()}
# Example request:
# curl -v -X POST 'http://127.0.0.1:8000/embedding' --header 'Content-Type: application/json' --data '{"text": "what is an apple?"}'