Add official results for AlpacaEval
Browse files
README.md
CHANGED
|
@@ -128,11 +128,11 @@ model-index:
|
|
| 128 |
type: AlpacaEval
|
| 129 |
metrics:
|
| 130 |
- type: AlpacaEval 1.0
|
| 131 |
-
value: 91.
|
| 132 |
name: Win Rate
|
| 133 |
source:
|
| 134 |
-
url: https://
|
| 135 |
-
name:
|
| 136 |
- task:
|
| 137 |
type: text-generation
|
| 138 |
dataset:
|
|
@@ -140,11 +140,11 @@ model-index:
|
|
| 140 |
type: AlpacaEval
|
| 141 |
metrics:
|
| 142 |
- type: AlpacaEval 2.0
|
| 143 |
-
value: 12.
|
| 144 |
name: Win Rate
|
| 145 |
source:
|
| 146 |
-
url: https://
|
| 147 |
-
name:
|
| 148 |
- task:
|
| 149 |
type: text-generation
|
| 150 |
dataset:
|
|
|
|
| 128 |
type: AlpacaEval
|
| 129 |
metrics:
|
| 130 |
- type: AlpacaEval 1.0
|
| 131 |
+
value: 91.16%
|
| 132 |
name: Win Rate
|
| 133 |
source:
|
| 134 |
+
url: https://tatsu-lab.github.io/alpaca_eval/
|
| 135 |
+
name: Leaderboard
|
| 136 |
- task:
|
| 137 |
type: text-generation
|
| 138 |
dataset:
|
|
|
|
| 140 |
type: AlpacaEval
|
| 141 |
metrics:
|
| 142 |
- type: AlpacaEval 2.0
|
| 143 |
+
value: 12.57%
|
| 144 |
name: Win Rate
|
| 145 |
source:
|
| 146 |
+
url: https://tatsu-lab.github.io/alpaca_eval/
|
| 147 |
+
name: Leaderboard
|
| 148 |
- task:
|
| 149 |
type: text-generation
|
| 150 |
dataset:
|