Update README.md
Browse files
README.md
CHANGED
@@ -126,6 +126,8 @@ All results below, except those for `Xwen-72B-Chat`, are sourced from [Arena-Har
|
|
126 |
| Llama-3.1-8B-Instruct π | 21.3 | (-1.9, 2.2) |
|
127 |
| Llama-3-8B-Instruct π | 20.6 | (-2.0, 1.9) |
|
128 |
| Starling-LM-7B-beta π | 23.0 | (-1.8, 1.8) |
|
|
|
|
|
129 |
|
130 |
|
131 |
|
@@ -160,6 +162,8 @@ All results below, except those for `Xwen-72B-Chat`, are sourced from [Arena-Har
|
|
160 |
| Llama-3.1-8B-Instruct π | 18.3 | (-1.6, 1.6) |
|
161 |
| Llama-3-8B-Instruct π | 19.8 | (-1.6, 1.9) |
|
162 |
| Starling-LM-7B-beta π | 26.1 | (-2.6, 2.0) |
|
|
|
|
|
163 |
|
164 |
|
165 |
### 3.2 AlignBench-v1.1
|
|
|
126 |
| Llama-3.1-8B-Instruct π | 21.3 | (-1.9, 2.2) |
|
127 |
| Llama-3-8B-Instruct π | 20.6 | (-2.0, 1.9) |
|
128 |
| Starling-LM-7B-beta π | 23.0 | (-1.8, 1.8) |
|
129 |
+
| DeepSeek-R1-Distill-Qwen-7B (only responses) π | 17.2 | (-1.4, 1.7) |
|
130 |
+
| DeepSeek-R1-Distill-Qwen-7B (w/ thoughts and responses) π | 13.6 | (-1.4, 1.8) |
|
131 |
|
132 |
|
133 |
|
|
|
162 |
| Llama-3.1-8B-Instruct π | 18.3 | (-1.6, 1.6) |
|
163 |
| Llama-3-8B-Instruct π | 19.8 | (-1.6, 1.9) |
|
164 |
| Starling-LM-7B-beta π | 26.1 | (-2.6, 2.0) |
|
165 |
+
| DeepSeek-R1-Distill-Qwen-7B (only responses) π | 18.5 | (-1.6, 1.8) |
|
166 |
+
| DeepSeek-R1-Distill-Qwen-7B (w/ thoughts and responses) π | 11.8 | (-1.6, 1.6) |
|
167 |
|
168 |
|
169 |
### 3.2 AlignBench-v1.1
|