Spaces:

awinml
/

2-qa-earnings-sentencewise

Build error

App Files Community

awinml committed on Mar 13, 2023

Commit

6966109

1 Parent(s): ac5b87a

Upload 2 files

Browse files

Files changed (1) hide show

utils.py +25 -18

utils.py CHANGED Viewed

@@ -64,13 +64,12 @@ def save_key(api_key):
 def query_pinecone(
     query, top_k, model, index, year, quarter, ticker, participant_type, threshold=0.25
 ):
-    # generate embeddings for the query
-    xq = model.encode([query]).tolist()
     if participant_type == "Company Speaker":
-        participant = "Speaker"
     else:
-        participant = participant_type
     if year == "All":
         if quarter == "All":
@@ -126,7 +125,6 @@ def query_pinecone(
             },
             include_metadata=True,
         )
     # filter the context passages based on the score threshold
     filtered_matches = []
     for match in xc["matches"]:
@@ -167,7 +165,7 @@ def text_lookup(data, sentence_ids):
 def generate_prompt(query_text, context_list):
     context = " ".join(context_list)
-    prompt = f"""Answer the question as accurately as possible using the provided context. Try to include as many key details as possible.
 Context: {context}
 Question: {query_text}
 Answer:"""
@@ -204,17 +202,26 @@ def gpt_model(prompt):
 def retrieve_transcript(data, year, quarter, ticker):
-    row = (
-        data.loc[
-            (data.Year == int(year))
-            & (data.Quarter == quarter)
-            & (data.Ticker == ticker),
-            ["File_Name"],
-        ]
-        .drop_duplicates()
-        .iloc[0, 0]
-    )
-    print(row)
     # convert row to a string and join values with "-"
     # row_str = "-".join(row.astype(str)) + ".txt"
     open_file = open(

 def query_pinecone(
     query, top_k, model, index, year, quarter, ticker, participant_type, threshold=0.25
 ):
     if participant_type == "Company Speaker":
+        participant = "Answer"
     else:
+        participant = "Question"
+    # generate embeddings for the query
+    xq = model.encode([query]).tolist()
     if year == "All":
         if quarter == "All":
             },
             include_metadata=True,
         )
     # filter the context passages based on the score threshold
     filtered_matches = []
     for match in xc["matches"]:
 def generate_prompt(query_text, context_list):
     context = " ".join(context_list)
+    prompt = f"""Answer the question in 5 detailed points as accurately as possible using the provided context. Try to include as many key details as possible.
 Context: {context}
 Question: {query_text}
 Answer:"""
 def retrieve_transcript(data, year, quarter, ticker):
+    if year == "All" or quarter == "All":
+        row = (
+            data.loc[
+                (data.Ticker == ticker),
+                ["File_Name"],
+            ]
+            .drop_duplicates()
+            .iloc[0, 0]
+        )
+    else:
+        row = (
+            data.loc[
+                (data.Year == int(year))
+                & (data.Quarter == quarter)
+                & (data.Ticker == ticker),
+                ["File_Name"],
+            ]
+            .drop_duplicates()
+            .iloc[0, 0]
+        )
     # convert row to a string and join values with "-"
     # row_str = "-".join(row.astype(str)) + ".txt"
     open_file = open(