Spaces:

KennyOry
/

PrintAI

Sleeping

App Files Files Community

KennyOry committed on Aug 14, 2025

Commit

5ae1040

verified ·

1 Parent(s): b5f0354

Update app.py

Browse files

Files changed (1) hide show

app.py +78 -24

app.py CHANGED Viewed

@@ -249,8 +249,8 @@ def web_search(query: str) -> tuple:
                 content = snippet  # Fallback на сниппет
             # Форматирование контента
-            relevant_content = extract_relevant_solution(content, norm_data)
-            combined_content += f"[[Источник {i+1}]] {title}\n{relevant_content}\n\n"
             # Сохранение источника
             source_data = {
@@ -303,6 +303,51 @@ def clean_response(response: str, sources: list) -> str:
     return response.strip()
 def process_query(prompt: str):
     try:
@@ -314,21 +359,28 @@ def process_query(prompt: str):
         message_queue.put(('log', f"⏏️ Извлечено: {json.dumps(norm_data, ensure_ascii=False)}"))
         search_query = norm_data['search_query']
-        message_queue.put(('log', f"🔍 Провожу поиск по запросу: {search_query}"))
-        # Получаем полный контент источников
-        _, sources = web_search(search_query)
-        # Формируем контент ТОЛЬКО из полных страниц, без сниппетов
-        full_content = ""
-        for i, source in enumerate(sources):
-            full_content += f"[[Источник {i+1}]] {source['title']}\n{source['content']}\n\n"
-        message_queue.put(('log', f"📚 Собрано: {len(full_content)} символов из {len(sources)} источников"))
-        # Генерируем ответ сразу на основе полного контента
-        message_queue.put(('log', "🧠 Генерирую ответ на основе полного контента источников..."))
-        message_queue.put(('response_start', ""))
         messages = [
             {"role": "system", "content": SYSTEM_PROMPT + f"""
@@ -336,17 +388,16 @@ def process_query(prompt: str):
             Бренд: {norm_data['brand']}
             Модель: {norm_data['model']}
             Ошибка: {norm_data['error_code']}
-            Суть проблемы: {norm_data['problem_description']}
-            ВАЖНО: Генерируй ответ ТОЛЬКО на основе предоставленных источников ниже.
-            Не выдумывай информацию, которой нет в источниках.
-            Источники:
-            {full_content}
             """},
             {"role": "user", "content": f"Проблема: {prompt}"}
         ]
         full_response = ""
         for chunk in mistral_client.chat.stream(
             model=MISTRAL_MODEL,
@@ -359,8 +410,11 @@ def process_query(prompt: str):
                 full_response += chunk_text
                 message_queue.put(('response_chunk', chunk_text))
         # Очистка и форматирование ответа
-        final_response = clean_response(full_response, sources)
         message_queue.put(('response_end', final_response))
         message_queue.put(('sources', json.dumps(sources)))

                 content = snippet  # Fallback на сниппет
             # Форматирование контента
+            cleaned_content = re.sub(r'\s+', ' ', content).strip()
+            combined_content += f"[[Источник {i+1}]] {title}\n{cleaned_content}\n\n"
             # Сохранение источника
             source_data = {
     return response.strip()
+def verify_with_sources(response: str, sources: list) -> str:
+    """Check the generated answer against the collected sources using the LLM.
+
+    Builds a verification prompt from the answer and the first 1500
+    characters of every source, sends it to the Mistral chat endpoint and
+    returns the corrected answer produced by the model.
+
+    Args:
+        response: The answer text generated for the user.
+        sources: Source records; each one is indexed by ``'title'`` and
+            ``'content'`` here.
+
+    Returns:
+        The stripped, model-corrected answer. The original ``response`` is
+        returned unchanged when there are no sources to check against, when
+        the model returns an empty completion, or when any error occurs
+        during verification.
+    """
+    # Without sources the prompt would ask the model to delete every step
+    # that has no confirmation, with nothing to confirm against. Skip the
+    # round-trip instead of risking a gutted answer.
+    if not sources:
+        return response
+    try:
+        message_queue.put(('log', "🔍 Проверяю соответствие ответа источникам..."))
+        # Truncate each source so the combined prompt stays bounded.
+        sources_text = "\n\n".join([
+            f"Источник {i+1} ({source['title']}):\n{source['content'][:1500]}"
+            for i, source in enumerate(sources)
+        ])
+        verification_prompt = f"""
+        Проверь соответствие решения источникам:
+        ### Ответ бота:
+        {response}
+        ### Источники:
+        {sources_text}
+        Правила проверки:
+        1. Все шаги решения должны иметь подтверждение в источниках
+        2. Детали замены должны точно соответствовать артикулам из источников
+        3. Если в ответе есть шаги не из источников - удали их
+        4. Если есть противоречия между источниками - укажи это в решении
+        5. Если ошибки в кодах ошибок - исправь
+        6. Сохрани оригинальную структуру ответа
+        Верни исправленный ответ.
+        """
+        # Low temperature: the model should edit the answer, not rewrite it.
+        verification = mistral_client.chat.complete(
+            model=MISTRAL_MODEL,
+            messages=[{"role": "user", "content": verification_prompt}],
+            max_tokens=2048,
+            temperature=0.1
+        )
+        verified_response = verification.choices[0].message.content
+        # An empty or missing completion must not replace a real answer.
+        if not verified_response or not verified_response.strip():
+            return response
+        return verified_response.strip()
+    except Exception as e:
+        # Verification is best-effort: log the failure and keep the
+        # unverified answer rather than failing the whole request.
+        error_msg = f"❌ Ошибка верификации: {str(e)}"
+        message_queue.put(('log', error_msg))
+        return response
 def process_query(prompt: str):
     try:
         message_queue.put(('log', f"⏏️ Извлечено: {json.dumps(norm_data, ensure_ascii=False)}"))
         search_query = norm_data['search_query']
+        search_data, sources = web_search(search_query)
+        message_queue.put(('log', f"📚 Собрано: {len(search_data)} символов в {len(sources)} источнике(-ах)"))
+        message_queue.put(('log', f"⚙️ Определяю проблему"))
+        problem_response = mistral_client.chat.complete(
+            model=MISTRAL_MODEL,
+            messages=[
+                {"role": "system", "content": "Опиши СУТЬ проблемы в одном предложении. Только диагноз, без решений. Не более 12 слов. На русском."},
+                {"role": "user", "content": f"Запрос пользователя: {prompt}\nПоисковые данные:\n{search_data}"}
+            ],
+            max_tokens=150,
+            temperature=0.2
+        )
+        extracted_problem = problem_response.choices[0].message.content.strip()
+        if not extracted_problem or len(extracted_problem) < 5:
+            extracted_problem = f"Неисправность {norm_data['brand']} {norm_data['model']}"
+        message_queue.put(('log', f"🧩 Определённая проблема: {extracted_problem}"))
+        sources_text = "\n".join([f"[{i+1}] {s['title']} - {s['url']}" for i, s in enumerate(sources)])
         messages = [
             {"role": "system", "content": SYSTEM_PROMPT + f"""
             Бренд: {norm_data['brand']}
             Модель: {norm_data['model']}
             Ошибка: {norm_data['error_code']}
+            Суть проблемы (на основе поиска): {extracted_problem}
+            Данные поиска:
+            {search_data}
             """},
             {"role": "user", "content": f"Проблема: {prompt}"}
         ]
+        message_queue.put(('log', "🧠 На основе полученных данных генерирую ответ..."))
+        message_queue.put(('response_start', ""))
         full_response = ""
         for chunk in mistral_client.chat.stream(
             model=MISTRAL_MODEL,
                 full_response += chunk_text
                 message_queue.put(('response_chunk', chunk_text))
+        # Проверка соответствия источникам
+        verified_response = verify_with_sources(full_response, sources)
         # Очистка и форматирование ответа
+        final_response = clean_response(verified_response, sources)
         message_queue.put(('response_end', final_response))
         message_queue.put(('sources', json.dumps(sources)))