Removed LLM init; reversed the order of the reranker results
Browse files
app.py
CHANGED
|
@@ -241,7 +241,7 @@ class BSIChatbot:
|
|
| 241 |
|
| 242 |
#self.vectorstore.
|
| 243 |
#retrieved_chunks = self.vectorstore.similarity_search(query=query, k=20)
|
| 244 |
-
retrieved_chunks = vectorstore.similarity_search(query=query, k=
|
| 245 |
#finalchunks = []
|
| 246 |
#for chunk in retrieved_chunks:
|
| 247 |
# if "---" not in chunk.page_content:
|
|
@@ -432,8 +432,12 @@ class BSIChatbot:
|
|
| 432 |
self.initializeRerankingModel()
|
| 433 |
print("Starting Reranking Chunks...")
|
| 434 |
rerankingModel
|
| 435 |
-
retrieved_chunks_text=rerankingModel.rerank(query, retrieved_chunks_text,k=
|
| 436 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 437 |
|
| 438 |
i = 1
|
| 439 |
for chunk in retrieved_chunks_text:
|
|
@@ -489,7 +493,7 @@ if __name__ == '__main__':
|
|
| 489 |
#bot.retrieveSimiliarEmbedding("Was ist der IT-Grundschutz?")
|
| 490 |
#TODO: DEBUG:
|
| 491 |
#time.sleep(10)
|
| 492 |
-
bot.initializeLLM()
|
| 493 |
#bot.retrieveSimiliarEmbedding("Welche Typen von Anforderungen gibt es im IT-Grundschutz?")
|
| 494 |
|
| 495 |
#bot.queryLLM("Welche Typen von Anforderungen gibt es im IT-Grundschutz?")
|
|
|
|
| 241 |
|
| 242 |
#self.vectorstore.
|
| 243 |
#retrieved_chunks = self.vectorstore.similarity_search(query=query, k=20)
|
| 244 |
+
retrieved_chunks = vectorstore.similarity_search(query=query, k=30)
|
| 245 |
#finalchunks = []
|
| 246 |
#for chunk in retrieved_chunks:
|
| 247 |
# if "---" not in chunk.page_content:
|
|
|
|
| 432 |
self.initializeRerankingModel()
|
| 433 |
print("Starting Reranking Chunks...")
|
| 434 |
rerankingModel
|
| 435 |
+
retrieved_chunks_text=rerankingModel.rerank(query, retrieved_chunks_text,k=15)
|
| 436 |
+
#REVERSE Rerank results!
|
| 437 |
+
print("DBG: Rankorder:")
|
| 438 |
+
for chunk in reversed(retrieved_chunks_text):
|
| 439 |
+
print(chunk.rank)
|
| 440 |
+
retrieved_chunks_text=[chunk["content"] for chunk in reversed(retrieved_chunks_text)]
|
| 441 |
|
| 442 |
i = 1
|
| 443 |
for chunk in retrieved_chunks_text:
|
|
|
|
| 493 |
#bot.retrieveSimiliarEmbedding("Was ist der IT-Grundschutz?")
|
| 494 |
#TODO: DEBUG:
|
| 495 |
#time.sleep(10)
|
| 496 |
+
#bot.initializeLLM()
|
| 497 |
#bot.retrieveSimiliarEmbedding("Welche Typen von Anforderungen gibt es im IT-Grundschutz?")
|
| 498 |
|
| 499 |
#bot.queryLLM("Welche Typen von Anforderungen gibt es im IT-Grundschutz?")
|