Update README.md
Browse files
README.md
CHANGED
@@ -26,7 +26,7 @@ Nxcode-CQ-7B-orpo is an ORPO fine-tune of Qwen/CodeQwen1.5-7B-Chat on 100k sampl
|
|
26 |
| EvalPlus | pass@1 |
|
27 |
| --- | --- |
|
28 |
| HumanEval | 86.0 |
|
29 |
-
|
|
30 |
|
31 |
[EvalPlus Leaderboard](https://evalplus.github.io/leaderboard.html)
|
32 |
| Models | HumanEval | HumanEval+|
|
@@ -36,6 +36,12 @@ Nxcode-CQ-7B-orpo is an ORPO fine-tune of Qwen/CodeQwen1.5-7B-Chat on 100k sampl
|
|
36 |
| GPT-4-Turbo (Nov 2023)| 85.4| 79.3|
|
37 |
| CodeQwen1.5-7B-Chat| 83.5| 78.7|
|
38 |
| claude-3-opus (Mar 2024)| 82.9| 76.8|
|
|
|
|
|
|
|
|
|
|
|
|
|
39 |
|
40 |
## Quickstart
|
41 |
|
|
|
26 |
| EvalPlus | pass@1 |
|
27 |
| --- | --- |
|
28 |
| HumanEval | 86.0 |
|
29 |
+
| HumanEval+ | 81.1 |
|
30 |
|
31 |
[EvalPlus Leaderboard](https://evalplus.github.io/leaderboard.html)
|
32 |
| Models | HumanEval | HumanEval+|
|
|
|
36 |
| GPT-4-Turbo (Nov 2023)| 85.4| 79.3|
|
37 |
| CodeQwen1.5-7B-Chat| 83.5| 78.7|
|
38 |
| claude-3-opus (Mar 2024)| 82.9| 76.8|
|
39 |
+
| DeepSeek-Coder-33B-instruct| 81.1| 75.0|
|
40 |
+
| WizardCoder-33B-V1.1| 79.9| 73.2|
|
41 |
+
| OpenCodeInterpreter-DS-33B| 79.3| 73.8|
|
42 |
+
| speechless-codellama-34B-v2.0| 77.4| 72.0|
|
43 |
+
| GPT-3.5-Turbo (Nov 2023)| 76.8| 70.7|
|
44 |
+
| Llama3-70B-instruct| 76.2| 70.7|
|
45 |
|
46 |
## Quickstart
|
47 |
|