Spaces:

EugeneXiang
/

ECHOscore

Sleeping

App Files Files Community

EugeneXiang committed on Apr 20, 2025

Commit

dcf611d

verified ·

1 Parent(s): 9b414c1

Upload 5 files

Browse files

Files changed (5) hide show

config.py +33 -0
export_utils.py +22 -0
radar_chart.py +25 -0
scoring_utils.py +21 -0
slang_parser.py +7 -0

config.py ADDED Viewed

	@@ -0,0 +1,33 @@

# Names of the evaluation systems, listed in display order.
SYSTEMS = [
    "Human",
    "OVAL",
    "DeepEval",
]

# Dimension order (shared by scoring, charts and display).
DIMENSIONS = [
    "Compliance",
    "Ethical",
    "Naturalness",
    "Structure",
    "Rationality",
    "Logic",
    "Non-hallucination",
    "Accuracy",
    "Coherence",
]

# Chinese label for each dimension (usable as table headers).
DIMENSION_ZH = {
    "Compliance": "合规性",
    "Ethical": "伦理性",
    "Naturalness": "自然度",
    "Structure": "结构性",
    "Rationality": "合理性",
    "Logic": "逻辑性",
    "Non-hallucination": "非幻觉性",
    "Accuracy": "准确性",
    "Coherence": "连贯性",
}

# Default scoring range as (minimum, maximum).
SCORE_RANGE = (0.0, 10.0)

# Colour per system (usable for charts).
SYSTEM_COLORS = {
    "Human": "#1f77b4",
    "OVAL": "#2ca02c",
    "DeepEval": "#ff7f0e",
}

export_utils.py ADDED Viewed

	@@ -0,0 +1,22 @@

+import csv
+import tempfile
def generate_csv_download(dimensions, systems, scores_data, notes, filename="evaluation_scores.csv"):
    """Write the score table and the slang notes to a temporary CSV file.

    File layout, in order:
      1. a header row: "维度" followed by every system name;
      2. one row per dimension holding each system's score (blank for None);
      3. an empty row;
      4. a row containing the label "网络用语备注";
      5. a row containing ``notes`` as a single cell.

    Args:
        dimensions: Dimension names; position ``i`` matches index ``i`` of
            every score sequence in ``scores_data``.
        systems: System names, used both as column headers and as keys
            into ``scores_data``.
        scores_data: Mapping of system name to a sequence of scores indexed
            like ``dimensions``; ``None`` entries are written as blanks.
        notes: Free-form notes written as one cell.
        filename: Not used by this function; the file receives a generated
            temporary name ending in ".csv". Kept so existing callers that
            pass it keep working.

    Returns:
        The path of the written file. It is created with ``delete=False``,
        so removing it is the caller's responsibility.

    Raises:
        KeyError: If a system is missing from ``scores_data``.
        IndexError: If a score sequence is shorter than ``dimensions``.
    """
    # The context manager guarantees the handle is closed even when a row
    # fails to build; delete=False keeps the file on disk after closing.
    with tempfile.NamedTemporaryFile(
        delete=False, suffix=".csv", mode="w", newline="", encoding="utf-8"
    ) as output:
        writer = csv.writer(output)
        # list() lets callers pass any sequence (e.g. a tuple) of systems.
        writer.writerow(["维度"] + list(systems))
        for idx, dim in enumerate(dimensions):
            row = [dim]
            for system in systems:
                score = scores_data[system][idx]
                row.append("" if score is None else score)
            writer.writerow(row)
        writer.writerow([])
        writer.writerow(["网络用语备注"])
        writer.writerow([notes])
    return output.name

radar_chart.py ADDED Viewed

	@@ -0,0 +1,25 @@

+import plotly.graph_objects as go
def make_radar_chart(dimensions, scores_dict):
    """Build a radar (polar) chart with one filled trace per system.

    Args:
        dimensions: Axis labels, passed as ``theta`` of every trace.
        scores_dict: Mapping of system name to a sequence of scores;
            ``None`` scores are plotted as 0.

    Returns:
        The assembled ``go.Figure``; its radial axis is fixed to [0, 10].
    """
    figure = go.Figure()

    for system_name, system_scores in scores_dict.items():
        # Missing scores fall back to the centre of the chart.
        radii = [0 if value is None else value for value in system_scores]
        trace = go.Scatterpolar(
            r=radii,
            theta=dimensions,
            fill="toself",
            name=system_name,
        )
        figure.add_trace(trace)

    radial_axis = {"visible": True, "range": [0, 10]}
    figure.update_layout(
        polar={"radialaxis": radial_axis},
        showlegend=True,
        autosize=True,
        margin={"l": 0, "r": 0, "t": 20, "b": 0},
        height=450,
    )
    return figure

scoring_utils.py ADDED Viewed

	@@ -0,0 +1,21 @@

+import hashlib
def stable_score(system, text, dimension):
    """Return a reproducible pseudo-score for a (system, text, dimension) triple.

    The MD5 hex digest of "<text>_<system>_<dimension>" is reduced modulo 41
    and mapped onto 1.0 .. 5.0 in steps of 0.1, so identical inputs always
    receive the same score.
    """
    key = "{}_{}_{}".format(text, system, dimension)
    digest = hashlib.md5(key.encode()).hexdigest()
    bucket = int(digest, 16) % 41  # 0 .. 40 inclusive
    return round(1 + bucket / 10, 1)
def make_explanation(system, dimension, score):
    """Return a one-sentence explanation of a score for the given dimension.

    Known dimensions use a canned remark; any other dimension gets the
    generic "<system> scored <dimension> at <score>." sentence.
    """
    # Templates are stored unformatted; only the selected one is filled in.
    templates = {
        "Structure": "{system} scored Structure at {score}: The text structure may be unclear; consider adding headings or breaking into paragraphs.",
        "Rationality": "{system} scored Rationality at {score}: Argument support is weak; consider adding logical reasoning or evidence.",
        "Logic": "{system} scored Logic at {score}: Flow seems disjointed; check for consistency and coherence between sentences.",
        "Non-hallucination": "{system} scored Non-hallucination at {score}: There may be inaccurate or made‑up information; please fact‑check.",
        "Accuracy": "{system} scored Accuracy at {score}: Minor factual inaccuracies may exist; verify claims against reliable sources.",
        "Coherence": "{system} scored Coherence at {score}: Sentences may lack a smooth narrative flow; consider rephrasing.",
        "Compliance": "{system} scored Compliance at {score}: Potential issues in legal or content safety compliance detected.",
        "Ethical": "{system} scored Ethical at {score}: Some content may raise ethical or cultural concerns.",
        "Naturalness": "{system} scored Naturalness at {score}: The tone might sound artificial or robotic; consider improving fluency.",
    }
    chosen = templates.get(dimension)
    if chosen is None:
        return f"{system} scored {dimension} at {score}."
    return chosen.format(system=system, score=score)

slang_parser.py ADDED Viewed

	@@ -0,0 +1,7 @@

def extract_slang_notes(user_notes):
    """Normalize the user's free-form notes about internet slang.

    Placeholder: the current version only trims surrounding whitespace. It
    can be extended later to detect sensitive words, non-standard terms,
    risky semantics, and so on.

    Args:
        user_notes: The raw notes text, or None when nothing was entered.

    Returns:
        The notes with leading/trailing whitespace removed; an empty string
        when ``user_notes`` is None.
    """
    # An empty input field may arrive as None; treat it as "no notes"
    # rather than failing on None.strip().
    if user_notes is None:
        return ""
    return user_notes.strip()