test_AI_Agent

Sleeping

App Files Community

SarahXia0405 committed on Dec 5, 2025

Commit

e440afe

verified ·

1 Parent(s): 7bd3326

Update rag_engine.py

Browse files

Files changed (1) hide show

rag_engine.py +15 -22

rag_engine.py CHANGED Viewed

@@ -7,6 +7,7 @@ from clare_core import (
     cosine_similarity,
 )
 from langsmith import traceable
 def build_rag_chunks_from_file(file, doc_type_val: str) -> List[Dict]:
@@ -57,18 +58,13 @@ def retrieve_relevant_chunks(
     返回拼接后的文本，供 prompt 使用。
     （增强版本：将检索内容记录到 LangSmith metadata）
     """
-    from langsmith import get_current_run
-    # 1) 空安全检查
     if not rag_chunks:
         return ""
-    # 2) 问题 embedding
     q_emb = get_embedding(question)
     if q_emb is None:
         return ""
-    # 3) 计算相似度
     scored = []
     for item in rag_chunks:
         emb = item.get("embedding")
@@ -81,26 +77,23 @@ def retrieve_relevant_chunks(
     if not scored:
         return ""
-    # 4) 按相似度排序
     scored.sort(key=lambda x: x[0], reverse=True)
     top_items = scored[:top_k]
     top_chunks = [t for _sim, t in top_items]
-    # 5) ⭐ 记录到 LangSmith（每个 chunk 的文本 + 相似度）
-    run = get_current_run()
-    if run:
-        run.update(
-            metadata={
-                "question": question,
-                "retrieved_chunks": [
-                    {
-                        "score": float(sim),
-                        "text_preview": text[:300],  # 避免 UI 太长，取前300字
-                    }
-                    for sim, text in top_items
-                ]
-            }
         )
-    # 6) 返回原格式的拼接结果
-    return "\n---\n".join(top_chunks)

     cosine_similarity,
 )
 from langsmith import traceable
+from langsmith.run_helpers import set_run_metadata
 def build_rag_chunks_from_file(file, doc_type_val: str) -> List[Dict]:
     返回拼接后的文本，供 prompt 使用。
     （增强版本：将检索内容记录到 LangSmith metadata）
     """
     if not rag_chunks:
         return ""
     q_emb = get_embedding(question)
     if q_emb is None:
         return ""
     scored = []
     for item in rag_chunks:
         emb = item.get("embedding")
     if not scored:
         return ""
     scored.sort(key=lambda x: x[0], reverse=True)
     top_items = scored[:top_k]
     top_chunks = [t for _sim, t in top_items]
+    # 使用 set_run_metadata 给当前 retriever run 打 metadata
+    try:
+        previews = [
+            {"score": float(sim), "text_preview": text[:300]}
+            for sim, text in top_items
+        ]
+        set_run_metadata(
+            question=question,
+            retrieved_chunks=previews,
         )
+    except Exception as e:
+        # observability 出错不能影响主流程
+        print(f"[LangSmith metadata error in retrieve_relevant_chunks] {repr(e)}")
+    # 用分隔线拼接，方便模型辨认不同片段
+    return "\n---\n".join(top_chunks)