| import sys |
| import os |
| import copy |
| import uvicorn |
| import socket |
| import logging |
| import datetime |
| from models.quotes_search_engine import QuoteSearchEngine |
| from models.data_reader import load_quotes_from_csv |
| from models.Query import Query, Query_Multiple, SearchResponse, SimilarQuote, QuoteVector, VectorResponse |
| from decouple import config |
| from fastapi import FastAPI, HTTPException, Depends, Body |
| from sentence_transformers import SentenceTransformer |
|
|
|
|
|
|
| |
# Source handed to ``load_quotes_from_csv``; an ``hf://`` dataset path.
quotes_path = "hf://datasets/jstet/quotes-500k/quotes.csv"

# Application object that the route decorators below register handlers on.
app = FastAPI(
    title="Search Prompt Engine",
    description="API for prompt search",
    version="1.0",
)

# Import-time bootstrap: load the quotes, then hand only the first 10,000 of
# them to the search engine's vector database.
quotes = load_quotes_from_csv(quotes_path)
search_engine = QuoteSearchEngine()
search_engine.add_quotes_to_vector_database(quotes[:10000])
|
|
@app.get("/")
def read_root():
    """Return a fixed status message showing the service is up."""
    status = {"message": "Quote Search Engine is running!"}
    return status
|
|
@app.post("/search/")
async def search_prompts(query: Query, k: int = 3):
    """Return the ``k`` stored quotes most similar to the submitted quote.

    Args:
        query: Request body; its ``quote`` field is the text searched for.
        k: How many matches to request from the search engine (query
            parameter, defaults to 3). Must be at least 1.

    Returns:
        A ``SearchResponse`` whose ``results`` pair each returned quote with
        its score, in the order the search engine produced them.

    Raises:
        HTTPException: 422 when ``k`` is smaller than 1.
    """
    # ``k`` comes straight from the query string. Reject zero/negative values
    # here rather than forwarding them to the engine, whose handling of such
    # a ``top_k`` is not visible from this module.
    if k < 1:
        raise HTTPException(status_code=422, detail="k must be a positive integer")

    print(f'Prompt: {query}')
    similar_quotes, distances = search_engine.most_similar(query.quote, top_k=k)
    print(f'Similar Quotes: {similar_quotes}')
    print(f'Cosine similarity: {distances}')
    print(40*'****')

    # Pair each quote with its score; float() turns the engine's numeric
    # type into a plain Python float for the response model.
    response = [
        SimilarQuote(prompt=prompt, distance=float(distance))
        for prompt, distance in zip(similar_quotes, distances)
    ]

    return SearchResponse(results=response)
|
|
@app.post("/all_vectors_similarities/")
async def all_vectors(query: Query):
    """Score the submitted quote against the search engine's whole index.

    Args:
        query: Request body; its ``quote`` field is encoded with the search
            engine's model and compared against ``search_engine.index``.

    Returns:
        A ``VectorResponse`` with one ``QuoteVector`` per item yielded by the
        similarity result, carrying that item's position and its score.
    """
    # NOTE(review): ``encode`` is presumably blocking, CPU-heavy work running
    # inside an ``async def`` handler -- confirm it does not stall the event
    # loop under load.
    encoded_query = search_engine.model.encode([query.quote])
    scores = search_engine.cosine_similarity(encoded_query, search_engine.index)

    print(f'Quote or phrase: {query}')
    print(f'All Vector Similarities: {scores}')
    print(40*'****')

    # NOTE(review): assumes iterating ``scores`` yields one scalar per indexed
    # vector; if ``cosine_similarity`` returns a 2-D (1, N) result, ``float()``
    # would fail on the row -- confirm against QuoteSearchEngine.
    return VectorResponse(
        results=[
            QuoteVector(vector=position, distance=float(score))
            for position, score in enumerate(scores)
        ]
    )
|
|
if __name__ == "__main__":
    # Script entry point: resolve "localhost" to an address and serve the
    # app on that address, port 8084.
    SERVER_HOST_IP = socket.gethostbyname("localhost")
    SERVER_PORT = 8084
    uvicorn.run(app, host=SERVER_HOST_IP, port=SERVER_PORT)