Spaces:
Sleeping
Sleeping
Commit
·
c0c8ab9
1
Parent(s):
e04e66f
top k reranker = 25, max rows = 5, max chars = 4000
Browse files
- documents_prep.py +1 -1
- utils.py +1 -1
documents_prep.py
CHANGED
|
@@ -38,7 +38,7 @@ def chunk_text_documents(documents):
|
|
| 38 |
return chunked
|
| 39 |
|
| 40 |
|
| 41 |
-
def chunk_table_by_rows(table_data, doc_id, rows_per_chunk=
|
| 42 |
"""
|
| 43 |
Chunk tables by rows with fallback to character limit.
|
| 44 |
Keeps 3-4 rows together, but splits individual rows if they're too large.
|
|
|
|
| 38 |
return chunked
|
| 39 |
|
| 40 |
|
| 41 |
+
def chunk_table_by_rows(table_data, doc_id, rows_per_chunk=5, max_chars=4000):
|
| 42 |
"""
|
| 43 |
Chunk tables by rows with fallback to character limit.
|
| 44 |
Keeps 3-4 rows together, but splits individual rows if they're too large.
|
utils.py
CHANGED
|
@@ -47,7 +47,7 @@ def answer_question(question, query_engine, reranker):
|
|
| 47 |
retrieved = query_engine.retrieve(question)
|
| 48 |
log_message(f"RETRIEVED: {len(retrieved)} unique nodes")
|
| 49 |
|
| 50 |
-
reranked = rerank_nodes(question, retrieved, reranker, top_k=
|
| 51 |
log_message(f"RERANKED: {len(reranked)} nodes")
|
| 52 |
|
| 53 |
# Group by document and type
|
|
|
|
| 47 |
retrieved = query_engine.retrieve(question)
|
| 48 |
log_message(f"RETRIEVED: {len(retrieved)} unique nodes")
|
| 49 |
|
| 50 |
+
reranked = rerank_nodes(question, retrieved, reranker, top_k=25, min_score=-0.5)
|
| 51 |
log_message(f"RERANKED: {len(reranked)} nodes")
|
| 52 |
|
| 53 |
# Group by document and type
|