Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -340,7 +340,7 @@ def semantic_search(query, embeddings, model, threshold=0.5):
|
|
| 340 |
sims = cosine_similarity(query_embedding, embeddings)[0]
|
| 341 |
return [(i, s) for i, s in enumerate(sims) if s > threshold]
|
| 342 |
|
| 343 |
-
def rag_summarize(texts, summarizer, top_k=10):
|
| 344 |
if not texts:
|
| 345 |
return "No relevant content to summarize."
|
| 346 |
vect = TfidfVectorizer()
|
|
@@ -350,7 +350,7 @@ def rag_summarize(texts, summarizer, top_k=10): # increased from 5 to 10
|
|
| 350 |
top_indices = scores.argsort()[::-1][:top_k]
|
| 351 |
ctx = "\n".join(texts[i] for i in top_indices)
|
| 352 |
prompt = "summarize: " + ctx[:1024]
|
| 353 |
-
out = summarizer(prompt, max_length=
|
| 354 |
return out[0]['summary_text']
|
| 355 |
|
| 356 |
def extract_month_year(q):
|
|
|
|
| 340 |
sims = cosine_similarity(query_embedding, embeddings)[0]
|
| 341 |
return [(i, s) for i, s in enumerate(sims) if s > threshold]
|
| 342 |
|
| 343 |
+
def rag_summarize(texts, summarizer, top_k=10):
|
| 344 |
if not texts:
|
| 345 |
return "No relevant content to summarize."
|
| 346 |
vect = TfidfVectorizer()
|
|
|
|
| 350 |
top_indices = scores.argsort()[::-1][:top_k]
|
| 351 |
ctx = "\n".join(texts[i] for i in top_indices)
|
| 352 |
prompt = "summarize: " + ctx[:1024]
|
| 353 |
+
out = summarizer(prompt, max_length=200, min_length=80, do_sample=False)
|
| 354 |
return out[0]['summary_text']
|
| 355 |
|
| 356 |
def extract_month_year(q):
|