cloudyu cherry0328 committed on
Commit
2af346d
·
verified ·
1 Parent(s): be27e1d

Update README.md (#17)

Browse files

- Update README.md (201bbe55d30efe0d117cb1d4f7e09b7596a7908a)


Co-authored-by: cherry0328 <cherry0328@users.noreply.huggingface.co>

Files changed (1) hide show
  1. README.md +16 -8
README.md CHANGED
@@ -19,7 +19,8 @@ model-index:
19
  value: 45.38
20
  name: strict accuracy
21
  source:
22
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
 
23
  name: Open LLM Leaderboard
24
  - task:
25
  type: text-generation
@@ -34,7 +35,8 @@ model-index:
34
  value: 41.21
35
  name: normalized accuracy
36
  source:
37
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
 
38
  name: Open LLM Leaderboard
39
  - task:
40
  type: text-generation
@@ -49,7 +51,8 @@ model-index:
49
  value: 6.57
50
  name: exact match
51
  source:
52
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
 
53
  name: Open LLM Leaderboard
54
  - task:
55
  type: text-generation
@@ -64,7 +67,8 @@ model-index:
64
  value: 11.74
65
  name: acc_norm
66
  source:
67
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
 
68
  name: Open LLM Leaderboard
69
  - task:
70
  type: text-generation
@@ -79,7 +83,8 @@ model-index:
79
  value: 17.78
80
  name: acc_norm
81
  source:
82
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
 
83
  name: Open LLM Leaderboard
84
  - task:
85
  type: text-generation
@@ -96,8 +101,12 @@ model-index:
96
  value: 41.85
97
  name: accuracy
98
  source:
99
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
 
100
  name: Open LLM Leaderboard
 
 
 
101
  ---
102
 
103
  # Mixtral MOE 2x34B
@@ -220,5 +229,4 @@ Detailed results can be found [here](https://huggingface.co/datasets/open-llm-le
220
  |MATH Lvl 5 (4-Shot)| 6.57|
221
  |GPQA (0-shot) |11.74|
222
  |MuSR (0-shot) |17.78|
223
- |MMLU-PRO (5-shot) |41.85|
224
-
 
19
  value: 45.38
20
  name: strict accuracy
21
  source:
22
+ url: >-
23
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
24
  name: Open LLM Leaderboard
25
  - task:
26
  type: text-generation
 
35
  value: 41.21
36
  name: normalized accuracy
37
  source:
38
+ url: >-
39
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
40
  name: Open LLM Leaderboard
41
  - task:
42
  type: text-generation
 
51
  value: 6.57
52
  name: exact match
53
  source:
54
+ url: >-
55
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
56
  name: Open LLM Leaderboard
57
  - task:
58
  type: text-generation
 
67
  value: 11.74
68
  name: acc_norm
69
  source:
70
+ url: >-
71
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
72
  name: Open LLM Leaderboard
73
  - task:
74
  type: text-generation
 
83
  value: 17.78
84
  name: acc_norm
85
  source:
86
+ url: >-
87
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
88
  name: Open LLM Leaderboard
89
  - task:
90
  type: text-generation
 
101
  value: 41.85
102
  name: accuracy
103
  source:
104
+ url: >-
105
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=cloudyu/Mixtral_34Bx2_MoE_60B
106
  name: Open LLM Leaderboard
107
+ base_model:
108
+ - jondurbin/bagel-dpo-34b-v0.2
109
+ - SUSTech/SUS-Chat-34B
110
  ---
111
 
112
  # Mixtral MOE 2x34B
 
229
  |MATH Lvl 5 (4-Shot)| 6.57|
230
  |GPQA (0-shot) |11.74|
231
  |MuSR (0-shot) |17.78|
232
+ |MMLU-PRO (5-shot) |41.85|