|
|
import sys |
|
|
import os |
|
|
import copy |
|
|
import uvicorn |
|
|
import socket |
|
|
import logging |
|
|
import datetime |
|
|
from models.quotes_search_engine import QuoteSearchEngine |
|
|
from models.data_reader import load_quotes_from_csv |
|
|
from models.Query import Query, Query_Multiple, SearchResponse, SimilarQuote, QuoteVector, VectorResponse |
|
|
from decouple import config |
|
|
from fastapi import FastAPI, HTTPException, Depends, Body |
|
|
from sentence_transformers import SentenceTransformer |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# `hf://` URL of the quotes CSV that is loaded when this module is imported.
quotes_path = "hf://datasets/jstet/quotes-500k/quotes.csv"

# Application object; the route handlers below register themselves on it
# through the `@app.get` / `@app.post` decorators.
app = FastAPI(
    title="Search Prompt Engine",
    description="API for prompt search",
    version="1.0",
)

# The index is built once, at import time, and shared by every request.
quotes = load_quotes_from_csv(quotes_path)
search_engine = QuoteSearchEngine()
# Only the first 10000 loaded quotes are added to the vector database.
search_engine.add_quotes_to_vector_database(quotes[:10000])
|
|
|
|
|
@app.get("/")
def read_root():
    """Return a fixed status message showing that the service is reachable."""
    status_message = "Quote Search Engine is running!"
    return {"message": status_message}
|
|
|
|
|
@app.post("/search/")
async def search_prompts(query: Query, k: int = 3):
    """Return the ``k`` stored quotes most similar to the submitted quote.

    Args:
        query: Parsed request payload; its ``quote`` attribute is the text
            handed to the search engine.
        k: Number of matches requested. Defaults to 3.

    Returns:
        A ``SearchResponse`` whose ``results`` list pairs every quote returned
        by the search engine with the score reported for it, in the order the
        engine returned them.

    Raises:
        HTTPException: With status 422 when ``k`` is smaller than 1.
    """
    # Guard the boundary here: `k` would otherwise be forwarded unchanged as
    # `top_k`, and nothing visible in this module shows the engine rejecting
    # zero or negative values. 422 mirrors the status FastAPI itself uses for
    # invalid request parameters.
    if k < 1:
        raise HTTPException(
            status_code=422,
            detail="k must be a positive integer",
        )

    # Debug trace on stdout (request, matches, scores, separator line).
    print(f'Prompt: {query}')
    similar_quotes, distances = search_engine.most_similar(query.quote, top_k=k)
    print(f'Similar Quotes: {similar_quotes}')
    print(f'Cosine similarity: {distances}')
    print(40*'****')

    # float() converts each score to a plain Python float before it is
    # stored on the response model.
    response = [
        SimilarQuote(prompt=prompt, distance=float(distance))
        for prompt, distance in zip(similar_quotes, distances)
    ]

    return SearchResponse(results=response)
|
|
|
|
|
@app.post("/all_vectors_similarities/")
async def all_vectors(query: Query):
    """Score the submitted quote against every entry of the engine's index.

    The quote is encoded with the search engine's model, compared against
    ``search_engine.index`` via ``search_engine.cosine_similarity``, and each
    resulting score is returned together with its position in that result.

    Args:
        query: Parsed request payload; its ``quote`` attribute is encoded.

    Returns:
        A ``VectorResponse`` whose ``results`` holds one ``QuoteVector`` per
        item yielded by iterating over the similarity result.
    """
    # The quote is wrapped in a one-element list before encoding.
    encoded_query = search_engine.model.encode([query.quote])
    similarity_scores = search_engine.cosine_similarity(
        encoded_query,
        search_engine.index,
    )

    # Debug trace on stdout (request, raw scores, separator line).
    print(f'Quote or phrase: {query}')
    print(f'All Vector Similarities: {similarity_scores}')
    print(40 * '****')

    # NOTE(review): assumes iterating the similarity result yields one scalar
    # per indexed vector, since float() is applied to each item - confirm
    # against QuoteSearchEngine.cosine_similarity.
    scored_vectors = [
        QuoteVector(vector=position, distance=float(score))
        for position, score in enumerate(similarity_scores)
    ]
    return VectorResponse(results=scored_vectors)
|
|
|
|
|
if __name__ == "__main__":
    # Runs only when the file is executed as a script: serve `app` with
    # uvicorn on port 8084 at the IPv4 address that "localhost" resolves to.
    SERVER_PORT = 8084
    SERVER_HOST_IP = socket.gethostbyname("localhost")
    uvicorn.run(app, port=SERVER_PORT, host=SERVER_HOST_IP)