tjl8 committed on
Commit
4d47856
·
verified ·
1 Parent(s): 66c32bf

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -340,7 +340,7 @@ def semantic_search(query, embeddings, model, threshold=0.5):
340
  sims = cosine_similarity(query_embedding, embeddings)[0]
341
  return [(i, s) for i, s in enumerate(sims) if s > threshold]
342
 
343
- def rag_summarize(texts, summarizer, top_k=10): # increased from 5 to 10
344
  if not texts:
345
  return "No relevant content to summarize."
346
  vect = TfidfVectorizer()
@@ -350,7 +350,7 @@ def rag_summarize(texts, summarizer, top_k=10): # increased from 5 to 10
350
  top_indices = scores.argsort()[::-1][:top_k]
351
  ctx = "\n".join(texts[i] for i in top_indices)
352
  prompt = "summarize: " + ctx[:1024]
353
- out = summarizer(prompt, max_length=250, min_length=80, do_sample=False)
354
  return out[0]['summary_text']
355
 
356
  def extract_month_year(q):
 
340
  sims = cosine_similarity(query_embedding, embeddings)[0]
341
  return [(i, s) for i, s in enumerate(sims) if s > threshold]
342
 
343
+ def rag_summarize(texts, summarizer, top_k=10):
344
  if not texts:
345
  return "No relevant content to summarize."
346
  vect = TfidfVectorizer()
 
350
  top_indices = scores.argsort()[::-1][:top_k]
351
  ctx = "\n".join(texts[i] for i in top_indices)
352
  prompt = "summarize: " + ctx[:1024]
353
+ out = summarizer(prompt, max_length=200, min_length=80, do_sample=False)
354
  return out[0]['summary_text']
355
 
356
  def extract_month_year(q):