Files changed (1) hide show
  1. src/about.py +47 -1
src/about.py CHANGED
@@ -1,13 +1,26 @@
1
  from dataclasses import dataclass
2
  from enum import Enum
3
-
4
  @dataclass
5
  class Task:
6
  benchmark: str
7
  metric: str
8
  col_name: str
9
 
 
 
 
 
 
 
 
 
 
 
 
 
10
 
 
11
  # Select your tasks here
12
  # ---------------------------------------------------
13
  class Tasks(Enum):
@@ -70,3 +83,36 @@ If everything is done, check you can launch the EleutherAIHarness on your model
70
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
71
  CITATION_BUTTON_TEXT = r"""
72
  """
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  from dataclasses import dataclass
2
  from enum import Enum
3
+ from pathlib import Path
4
  @dataclass
5
  class Task:
6
  benchmark: str
7
  metric: str
8
  col_name: str
9
 
10
+ REPORT_MD_PATH = Path(__file__).parent.parent / "Files" / "report.md"
11
+ with open(REPORT_MD_PATH, "r", encoding="utf-8") as f:
12
+ REPORT_TEXT = f.read()
13
+
14
+ TITLE = "# LLM Benchmark Leaderboard"
15
+
16
+ # Use the contents of report.md as LLM_BENCHMARKS_TEXT
17
+ LLM_BENCHMARKS_TEXT = REPORT_TEXT
18
+
19
+ CITATION_BUTTON_LABEL = "📖 Citation"
20
+ CITATION_BUTTON_TEXT = """If you use this benchmark, please cite: ...
21
+ (原citation内容保留)"""
22
 
23
+ EVALUATION_QUEUE_TEXT = "Models submitted for evaluation will appear here."
24
  # Select your tasks here
25
  # ---------------------------------------------------
26
  class Tasks(Enum):
 
83
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
84
  CITATION_BUTTON_TEXT = r"""
85
  """
86
+ # Report
87
+
88
+ ## 1. 模型及类别选择
89
+
90
+ 本次实验选用了三款大模型:Llama 3、Mistral 7B 和 ChatGPT。
91
+
92
+ - **Llama 3**:开源社区广泛使用,适合中英文任务。
93
+ - **Mistral 7B**:轻量级,适合边缘设备。
94
+ - **ChatGPT**:闭源,适合通用对话任务,表现最优。
95
+
96
+ | 模型名称 | 参数量 | 开源情况 | 主要用途 |
97
+ |------------|--------|---------|----------------|
98
+ | Llama 3 | 70B | 是 | 多语言任务 |
99
+ | Mistral 7B | 7B | 是 | 低功耗推理任务 |
100
+ | ChatGPT | 未公开 | 否 | 通用对话、推理任务 |
101
+
102
+ **选择理由**:
103
+ - Llama 3 和 Mistral 7B 为开源模型,方便定制与修改;
104
+ - ChatGPT 性能优越,作为对比基准。
105
+
106
+ ---
107
+
108
+ ## 2. 系统实现细节
109
+
110
+ ### Gradio交互界面截图
111
+ ![Gradio界面](./interface.png)
112
+
113
+ ### 输入与输出流程图
114
+ ```mermaid
115
+ graph TD
116
+ A[用户输入] --> B[Gradio界面]
117
+ B --> C[模型推理]
118
+ C --> D[返回结果]