cache faster
Browse files
App/Embedding/utils/Initialize.py
CHANGED
|
@@ -11,6 +11,7 @@ from .Elastic import FetchDocuments
|
|
| 11 |
index_name = "movie-recommender-fast"
|
| 12 |
model_name = "thenlper/gte-base"
|
| 13 |
embeddings = HuggingFaceEmbeddings(model_name=model_name)
|
|
|
|
| 14 |
|
| 15 |
TMDB_API = os.environ.get("TMDB_API")
|
| 16 |
|
|
@@ -26,6 +27,7 @@ vector_index = pinecone.Index(index_name=index_name)
|
|
| 26 |
docsearch = Pinecone.from_existing_index(index_name, embeddings)
|
| 27 |
|
| 28 |
|
|
|
|
| 29 |
def check_if_exists(text, imdb_id):
|
| 30 |
results = docsearch.similarity_search(text, filter={"key": {"$eq": imdb_id}}, k=1)
|
| 31 |
if results:
|
|
@@ -34,6 +36,7 @@ def check_if_exists(text, imdb_id):
|
|
| 34 |
return False
|
| 35 |
|
| 36 |
|
|
|
|
| 37 |
def add_document(imdb_id, doc):
|
| 38 |
text, temp_doc = doc
|
| 39 |
response = check_if_exists(text=text, imdb_id=imdb_id)
|
|
@@ -51,12 +54,14 @@ def add_document(imdb_id, doc):
|
|
| 51 |
docsearch.add_documents([temp])
|
| 52 |
|
| 53 |
|
|
|
|
| 54 |
def generate_text(doc):
|
| 55 |
if doc["tv_results"]:
|
| 56 |
return pprint.pformat(doc["tv_results"][0]), doc["tv_results"][0]
|
| 57 |
return pprint.pformat(doc["movie_results"][0]), doc["movie_results"][0]
|
| 58 |
|
| 59 |
|
|
|
|
| 60 |
def IdSearch(query: str, background_task: BackgroundTasks):
|
| 61 |
doc = requests.get(
|
| 62 |
f"https://api.themoviedb.org/3/find/{query}?external_source=imdb_id&language=en&api_key={TMDB_API}"
|
|
@@ -70,6 +75,7 @@ def IdSearch(query: str, background_task: BackgroundTasks):
|
|
| 70 |
return TextSearch(text, filter={"key": {"$ne": query}})
|
| 71 |
|
| 72 |
|
|
|
|
| 73 |
def TextSearch(query: str, filter=None):
|
| 74 |
docs = docsearch.similarity_search(query, k=10, filter=filter)
|
| 75 |
keys = [doc.metadata["key"] for doc in docs]
|
|
|
|
| 11 |
index_name = "movie-recommender-fast"
|
| 12 |
model_name = "thenlper/gte-base"
|
| 13 |
embeddings = HuggingFaceEmbeddings(model_name=model_name)
|
| 14 |
+
from fastapi_cache.decorator import cache
|
| 15 |
|
| 16 |
TMDB_API = os.environ.get("TMDB_API")
|
| 17 |
|
|
|
|
| 27 |
docsearch = Pinecone.from_existing_index(index_name, embeddings)
|
| 28 |
|
| 29 |
|
| 30 |
+
@cache(namespace="test")
|
| 31 |
def check_if_exists(text, imdb_id):
|
| 32 |
results = docsearch.similarity_search(text, filter={"key": {"$eq": imdb_id}}, k=1)
|
| 33 |
if results:
|
|
|
|
| 36 |
return False
|
| 37 |
|
| 38 |
|
| 39 |
+
@cache(namespace="test")
|
| 40 |
def add_document(imdb_id, doc):
|
| 41 |
text, temp_doc = doc
|
| 42 |
response = check_if_exists(text=text, imdb_id=imdb_id)
|
|
|
|
| 54 |
docsearch.add_documents([temp])
|
| 55 |
|
| 56 |
|
| 57 |
+
@cache(namespace="test")
|
| 58 |
def generate_text(doc):
|
| 59 |
if doc["tv_results"]:
|
| 60 |
return pprint.pformat(doc["tv_results"][0]), doc["tv_results"][0]
|
| 61 |
return pprint.pformat(doc["movie_results"][0]), doc["movie_results"][0]
|
| 62 |
|
| 63 |
|
| 64 |
+
# @cache(namespace="test")
|
| 65 |
def IdSearch(query: str, background_task: BackgroundTasks):
|
| 66 |
doc = requests.get(
|
| 67 |
f"https://api.themoviedb.org/3/find/{query}?external_source=imdb_id&language=en&api_key={TMDB_API}"
|
|
|
|
| 75 |
return TextSearch(text, filter={"key": {"$ne": query}})
|
| 76 |
|
| 77 |
|
| 78 |
+
# @cache(namespace="test")
|
| 79 |
def TextSearch(query: str, filter=None):
|
| 80 |
docs = docsearch.similarity_search(query, k=10, filter=filter)
|
| 81 |
keys = [doc.metadata["key"] for doc in docs]
|