test_AI_Agent

Sleeping

SarahXia0405 committed on Dec 5, 2025

Commit

5543909

verified ·

1 Parent(s): 8a1fd1b

Update rag_engine.py

Files changed (1) hide show

rag_engine.py CHANGED Viewed

@@ -55,14 +55,20 @@ def retrieve_relevant_chunks(
     """
     用 embedding 对当前问题做一次检索，从 rag_chunks 中找出最相关的 top_k 段落，
     返回拼接后的文本，供 prompt 使用。
     """
     if not rag_chunks:
         return ""
     q_emb = get_embedding(question)
     if q_emb is None:
         return ""
     scored = []
     for item in rag_chunks:
         emb = item.get("embedding")
@@ -75,8 +81,26 @@ def retrieve_relevant_chunks(
     if not scored:
         return ""
     scored.sort(key=lambda x: x[0], reverse=True)
-    top_chunks = [t for _sim, t in scored[:top_k]]
-    # 用分隔线拼接，方便模型辨认不同片段
     return "\n---\n".join(top_chunks)

     """
     用 embedding 对当前问题做一次检索，从 rag_chunks 中找出最相关的 top_k 段落，
     返回拼接后的文本，供 prompt 使用。
+    （增强版本：将检索内容记录到 LangSmith metadata）
     """
+    from langsmith import get_current_run
+    # 1) 空安全检查
     if not rag_chunks:
         return ""
+    # 2) 问题 embedding
     q_emb = get_embedding(question)
     if q_emb is None:
         return ""
+    # 3) 计算相似度
     scored = []
     for item in rag_chunks:
         emb = item.get("embedding")
     if not scored:
         return ""
+    # 4) 按相似度排序
     scored.sort(key=lambda x: x[0], reverse=True)
+    top_items = scored[:top_k]
+    top_chunks = [t for _sim, t in top_items]
+    # 5) ⭐ 记录到 LangSmith（每个 chunk 的文本 + 相似度）
+    run = get_current_run()
+    if run:
+        run.update(
+            metadata={
+                "question": question,
+                "retrieved_chunks": [
+                    {
+                        "score": float(sim),
+                        "text_preview": text[:300],  # 避免 UI 太长，取前300字
+                    }
+                    for sim, text in top_items
+                ]
+            }
+        )
+    # 6) 返回原格式的拼接结果
     return "\n---\n".join(top_chunks)