Update README.md
Browse files
README.md
CHANGED
|
@@ -112,21 +112,21 @@ Average: 68.75%
|
|
| 112 |
|
| 113 |
| Task | Version | Metric | Value | StdErr |
|
| 114 |
| --- | --- | --- | --- | --- |
|
| 115 |
-
| agieval\_aqua\_rat | | acc | 28.35 | 2.83 |
|
| 116 |
| | | acc\_norm | 26.38 | 2.77 |
|
| 117 |
-
| agieval\_logiqa\_en | | acc | 38.25 | 1.91 |
|
| 118 |
| | | acc\_norm | 38.09 | 1.90 |
|
| 119 |
-
| agieval\_lsat\_ar | | acc | 23.91 | 2.82 |
|
| 120 |
| | | acc\_norm | 23.48 | 2.80 |
|
| 121 |
-
| agieval\_lsat\_lr | | acc | 52.75 | 2.21 |
|
| 122 |
| | | acc\_norm | 53.92 | 2.21 |
|
| 123 |
-
| agieval\_lsat\_rc | | acc | 66.91 | 2.87 |
|
| 124 |
| | | acc\_norm | 67.29 | 2.87 |
|
| 125 |
-
| agieval\_sat\_en | | acc | 78.64 | 2.86 |
|
| 126 |
| | | acc\_norm | 78.64 | 2.86 |
|
| 127 |
-
| agieval\_sat\_en\_without\_passage | | acc | 45.15 | 3.48 |
|
| 128 |
| | | acc\_norm | 44.17 | 3.47 |
|
| 129 |
-
| agieval\_sat\_math | | acc | 33.18 | 3.18 |
|
| 130 |
| | | acc\_norm | 31.36 | 3.14 |
|
| 131 |
|
| 132 |
Average: 47.44%
|
|
|
|
| 112 |
|
| 113 |
| Task | Version | Metric | Value | StdErr |
|
| 114 |
| --- | --- | --- | --- | --- |
|
| 115 |
+
| agieval\_aqua\_rat | 0 | acc | 28.35 | 2.83 |
|
| 116 |
| | | acc\_norm | 26.38 | 2.77 |
|
| 117 |
+
| agieval\_logiqa\_en | 0 | acc | 38.25 | 1.91 |
|
| 118 |
| | | acc\_norm | 38.09 | 1.90 |
|
| 119 |
+
| agieval\_lsat\_ar | 0 | acc | 23.91 | 2.82 |
|
| 120 |
| | | acc\_norm | 23.48 | 2.80 |
|
| 121 |
+
| agieval\_lsat\_lr | 0 | acc | 52.75 | 2.21 |
|
| 122 |
| | | acc\_norm | 53.92 | 2.21 |
|
| 123 |
+
| agieval\_lsat\_rc | 0 | acc | 66.91 | 2.87 |
|
| 124 |
| | | acc\_norm | 67.29 | 2.87 |
|
| 125 |
+
| agieval\_sat\_en | 0 | acc | 78.64 | 2.86 |
|
| 126 |
| | | acc\_norm | 78.64 | 2.86 |
|
| 127 |
+
| agieval\_sat\_en\_without\_passage | 0 | acc | 45.15 | 3.48 |
|
| 128 |
| | | acc\_norm | 44.17 | 3.47 |
|
| 129 |
+
| agieval\_sat\_math | 0 | acc | 33.18 | 3.18 |
|
| 130 |
| | | acc\_norm | 31.36 | 3.14 |
|
| 131 |
|
| 132 |
Average: 47.44%
|