Add deletion of the CSV file and Pinecone index created during a session
Browse files
app.py
CHANGED
|
@@ -2,6 +2,7 @@ import logging
|
|
| 2 |
import os
|
| 3 |
import gradio as gr
|
| 4 |
import pandas as pd
|
|
|
|
| 5 |
from utils import get_zotero_ids, get_arxiv_papers, get_hf_embeddings, upload_to_pinecone, get_new_papers, recommend_papers
|
| 6 |
|
| 7 |
HF_API_KEY = os.getenv('HF_API_KEY')
|
|
@@ -94,4 +95,16 @@ with gr.Blocks() as demo:
|
|
| 94 |
|
| 95 |
return results
|
| 96 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 97 |
demo.launch(share = True)
|
|
|
|
| 2 |
import os
|
| 3 |
import gradio as gr
|
| 4 |
import pandas as pd
|
| 5 |
+
from pinecone import Pinecone
|
| 6 |
from utils import get_zotero_ids, get_arxiv_papers, get_hf_embeddings, upload_to_pinecone, get_new_papers, recommend_papers
|
| 7 |
|
| 8 |
HF_API_KEY = os.getenv('HF_API_KEY')
|
|
|
|
| 95 |
|
| 96 |
return results
|
| 97 |
|
| 98 |
+
file_path = 'arxiv-scrape.csv'
|
| 99 |
+
if os.path.exists(file_path):
|
| 100 |
+
os.remove(file_path)
|
| 101 |
+
logging.info(f"{file_path} has been deleted. Delete this part of the code if you want to persist recommended papers.")
|
| 102 |
+
|
| 103 |
+
api_key = os.getenv('PINECONE_API_KEY')
|
| 104 |
+
index = os.getenv('INDEX_NAME')
|
| 105 |
+
pc = Pinecone(api_key = api_key)
|
| 106 |
+
if index in pc.list_indexes().names():
|
| 107 |
+
pc.delete_index(index)
|
| 108 |
+
logging.info(f"{index} index has been deleted from the vectordb. Delete this part of the code if you want to persist recommended papers.")
|
| 109 |
+
|
| 110 |
demo.launch(share = True)
|
utils.py
CHANGED
|
@@ -60,7 +60,7 @@ def get_hf_embeddings(api_key, df):
|
|
| 60 |
headers = {"Authorization": f"Bearer {api_key}"}
|
| 61 |
|
| 62 |
response = requests.post(API_URL, headers=headers, json={"inputs": title_abs, "wait_for_model": False})
|
| 63 |
-
print(str(response.status_code) + 'This part needs an update, causing KeyError 0')
|
| 64 |
if response.status_code == 503:
|
| 65 |
response = requests.post(API_URL, headers=headers, json={"inputs": title_abs, "wait_for_model": True})
|
| 66 |
|
|
@@ -82,6 +82,7 @@ def upload_to_pinecone(api_key, index, namespace, embeddings, dim, df):
|
|
| 82 |
name=index,
|
| 83 |
dimension=dim,
|
| 84 |
metric="cosine",
|
|
|
|
| 85 |
spec=ServerlessSpec(
|
| 86 |
cloud='aws',
|
| 87 |
region='us-east-1'
|
|
|
|
| 60 |
headers = {"Authorization": f"Bearer {api_key}"}
|
| 61 |
|
| 62 |
response = requests.post(API_URL, headers=headers, json={"inputs": title_abs, "wait_for_model": False})
|
| 63 |
+
print(str(response.status_code) + 'This part needs an update, causing KeyError 0 ')
|
| 64 |
if response.status_code == 503:
|
| 65 |
response = requests.post(API_URL, headers=headers, json={"inputs": title_abs, "wait_for_model": True})
|
| 66 |
|
|
|
|
| 82 |
name=index,
|
| 83 |
dimension=dim,
|
| 84 |
metric="cosine",
|
| 85 |
+
deletion_protection="disabled",
|
| 86 |
spec=ServerlessSpec(
|
| 87 |
cloud='aws',
|
| 88 |
region='us-east-1'
|