ArkaAbacus
committed on
Commit
•
52c5409
1
Parent(s):
a840a3d
Update README.md
Browse files
README.md
CHANGED
@@ -36,7 +36,7 @@ Score vs selected others (sourced from: (https://lmsys.org/blog/2024-04-19-arena
|
|
36 |
| :---- | ---------: | ----------: | ------: |
|
37 |
| GPT-4-Turbo-2024-04-09 | 82.6 | (-1.8, 1.6) | 662 |
|
38 |
| Claude-3-Opus-20240229 | 60.4 | (-3.3, 2.4) | 541 |
|
39 |
-
| **Smaug-Llama-3-70B-Instruct
|
40 |
| Llama-3-70B-Instruct | 41.1 | (-2.5, 2.4) | 583 |
|
41 |
| Mistral-Large-2402 | 37.7 | (-1.9, 2.6) | 400 |
|
42 |
| Mixtral-8x22B-Instruct-v0.1 | 36.4 | (-2.7, 2.9) | 430 |
|
@@ -70,7 +70,7 @@ Meta-Llama-3-70B-Instruct 9.006250
|
|
70 |
|
71 |
| Model | First turn | Second Turn | Average |
|
72 |
| :---- | ---------: | ----------: | ------: |
|
73 |
-
| Smaug-Llama-3-70B-Instruct | 9.40 | 9.01 | 9.21 |
|
74 |
| GPT-4-Turbo | 9.38 | 9.00 | 9.19 |
|
75 |
| Meta-Llama-3-70B-Instruct | 9.21 | 8.80 | 9.01 |
|
76 |
|
|
|
36 |
| :---- | ---------: | ----------: | ------: |
|
37 |
| GPT-4-Turbo-2024-04-09 | 82.6 | (-1.8, 1.6) | 662 |
|
38 |
| Claude-3-Opus-20240229 | 60.4 | (-3.3, 2.4) | 541 |
|
39 |
+
| **Smaug-Llama-3-70B-Instruct** | 56.7 | (-2.2, 2.6) | 661 |
|
40 |
| Llama-3-70B-Instruct | 41.1 | (-2.5, 2.4) | 583 |
|
41 |
| Mistral-Large-2402 | 37.7 | (-1.9, 2.6) | 400 |
|
42 |
| Mixtral-8x22B-Instruct-v0.1 | 36.4 | (-2.7, 2.9) | 430 |
|
|
|
70 |
|
71 |
| Model | First turn | Second Turn | Average |
|
72 |
| :---- | ---------: | ----------: | ------: |
|
73 |
+
| **Smaug-Llama-3-70B-Instruct** | 9.40 | 9.01 | 9.21 |
|
74 |
| GPT-4-Turbo | 9.38 | 9.00 | 9.19 |
|
75 |
| Meta-Llama-3-70B-Instruct | 9.21 | 8.80 | 9.01 |
|
76 |
|