Spaces:
Sleeping
Sleeping
Commit
·
0f9c9b1
1
Parent(s):
2395c5e
Show the first 400 characters of node text in logging
Browse files
utils.py
CHANGED
|
@@ -120,7 +120,6 @@ def generate_sources_html(nodes, chunks_df=None):
|
|
| 120 |
section_text = metadata.get('section_text', '')
|
| 121 |
section_path = metadata.get('section_path', '')
|
| 122 |
|
| 123 |
-
# Create a unique key for grouping
|
| 124 |
if doc_type == 'table':
|
| 125 |
table_num = metadata.get('table_number', 'unknown')
|
| 126 |
key = f"{doc_id}_table_{table_num}"
|
|
@@ -128,7 +127,6 @@ def generate_sources_html(nodes, chunks_df=None):
|
|
| 128 |
image_num = metadata.get('image_number', 'unknown')
|
| 129 |
key = f"{doc_id}_image_{image_num}"
|
| 130 |
else:
|
| 131 |
-
# For text documents, group by section path or section id
|
| 132 |
section_key = section_path if section_path else section_id
|
| 133 |
key = f"{doc_id}_text_{section_key}"
|
| 134 |
|
|
@@ -215,7 +213,7 @@ def answer_question(question, query_engine, reranker, current_model, chunks_df=N
|
|
| 215 |
log_message(f" Документ: {node.metadata.get('document_id', 'unknown')}")
|
| 216 |
log_message(f" Тип: {node.metadata.get('type', 'unknown')}")
|
| 217 |
log_message(f" Раздел: {node.metadata.get('section_id', 'unknown')}")
|
| 218 |
-
log_message(f" Текст (первые
|
| 219 |
log_message(f" Метаданные: {node.metadata}")
|
| 220 |
|
| 221 |
# Переранжировка
|
|
@@ -283,17 +281,7 @@ def answer_question(question, query_engine, reranker, current_model, chunks_df=N
|
|
| 283 |
log_message(f"Ошибка обработки вопроса: {str(e)}")
|
| 284 |
error_msg = f"<div style='background-color: #e53e3e; color: white; padding: 20px; border-radius: 10px;'>Ошибка обработки вопроса: {str(e)}</div>"
|
| 285 |
return error_msg, ""
|
| 286 |
-
|
| 287 |
-
import sys
|
| 288 |
-
from llama_index.llms.google_genai import GoogleGenAI
|
| 289 |
-
from llama_index.llms.openai import OpenAI
|
| 290 |
-
from llama_index.embeddings.huggingface import HuggingFaceEmbedding
|
| 291 |
-
from sentence_transformers import CrossEncoder
|
| 292 |
-
from config import AVAILABLE_MODELS, DEFAULT_MODEL, GOOGLE_API_KEY
|
| 293 |
-
import time
|
| 294 |
-
from index_retriever import rerank_nodes
|
| 295 |
-
from my_logging import log_message
|
| 296 |
-
from config import PROMPT_SIMPLE_POISK
|
| 297 |
|
| 298 |
def get_llm_model(model_name):
|
| 299 |
try:
|
|
@@ -490,7 +478,7 @@ def answer_question(question, query_engine, reranker, current_model, chunks_df=N
|
|
| 490 |
log_message(f" Документ: {node.metadata.get('document_id', 'unknown')}")
|
| 491 |
log_message(f" Тип: {node.metadata.get('type', 'unknown')}")
|
| 492 |
log_message(f" Раздел: {node.metadata.get('section_id', 'unknown')}")
|
| 493 |
-
log_message(f" Текст (первые
|
| 494 |
log_message(f" Метаданные: {node.metadata}")
|
| 495 |
|
| 496 |
# Переранжировка
|
|
|
|
| 120 |
section_text = metadata.get('section_text', '')
|
| 121 |
section_path = metadata.get('section_path', '')
|
| 122 |
|
|
|
|
| 123 |
if doc_type == 'table':
|
| 124 |
table_num = metadata.get('table_number', 'unknown')
|
| 125 |
key = f"{doc_id}_table_{table_num}"
|
|
|
|
| 127 |
image_num = metadata.get('image_number', 'unknown')
|
| 128 |
key = f"{doc_id}_image_{image_num}"
|
| 129 |
else:
|
|
|
|
| 130 |
section_key = section_path if section_path else section_id
|
| 131 |
key = f"{doc_id}_text_{section_key}"
|
| 132 |
|
|
|
|
| 213 |
log_message(f" Документ: {node.metadata.get('document_id', 'unknown')}")
|
| 214 |
log_message(f" Тип: {node.metadata.get('type', 'unknown')}")
|
| 215 |
log_message(f" Раздел: {node.metadata.get('section_id', 'unknown')}")
|
| 216 |
+
log_message(f" Текст (первые 400 символов): {node.text[:400]}...")
|
| 217 |
log_message(f" Метаданные: {node.metadata}")
|
| 218 |
|
| 219 |
# Переранжировка
|
|
|
|
| 281 |
log_message(f"Ошибка обработки вопроса: {str(e)}")
|
| 282 |
error_msg = f"<div style='background-color: #e53e3e; color: white; padding: 20px; border-radius: 10px;'>Ошибка обработки вопроса: {str(e)}</div>"
|
| 283 |
return error_msg, ""
|
| 284 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 285 |
|
| 286 |
def get_llm_model(model_name):
|
| 287 |
try:
|
|
|
|
| 478 |
log_message(f" Документ: {node.metadata.get('document_id', 'unknown')}")
|
| 479 |
log_message(f" Тип: {node.metadata.get('type', 'unknown')}")
|
| 480 |
log_message(f" Раздел: {node.metadata.get('section_id', 'unknown')}")
|
| 481 |
+
log_message(f" Текст (первые 400 символов): {node.text[:400]}...")
|
| 482 |
log_message(f" Метаданные: {node.metadata}")
|
| 483 |
|
| 484 |
# Переранжировка
|