MaziyarPanahi
committed on
Commit
•
1ddcf7c
1
Parent(s):
1b1fc3f
Update README.md
Browse files
README.md
CHANGED
@@ -10,7 +10,7 @@ tags:
|
|
10 |
- finetune
|
11 |
- chatml
|
12 |
base_model: Qwen/Qwen2-72B-Instruct
|
13 |
-
model_name: MaziyarPanahi/
|
14 |
license_name: tongyi-qianwen
|
15 |
license_link: https://huggingface.co/Qwen/Qwen2-72B-Instruct/blob/main/LICENSE
|
16 |
pipeline_tag: text-generation
|
@@ -18,7 +18,7 @@ inference: false
|
|
18 |
model_creator: MaziyarPanahi
|
19 |
quantized_by: MaziyarPanahi
|
20 |
model-index:
|
21 |
-
- name:
|
22 |
results:
|
23 |
- task:
|
24 |
type: text-generation
|
@@ -33,7 +33,7 @@ model-index:
|
|
33 |
value: 81.63
|
34 |
name: strict accuracy
|
35 |
source:
|
36 |
-
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/
|
37 |
name: Open LLM Leaderboard
|
38 |
- task:
|
39 |
type: text-generation
|
@@ -48,7 +48,7 @@ model-index:
|
|
48 |
value: 57.33
|
49 |
name: normalized accuracy
|
50 |
source:
|
51 |
-
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/
|
52 |
name: Open LLM Leaderboard
|
53 |
- task:
|
54 |
type: text-generation
|
@@ -63,7 +63,7 @@ model-index:
|
|
63 |
value: 36.03
|
64 |
name: exact match
|
65 |
source:
|
66 |
-
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/
|
67 |
name: Open LLM Leaderboard
|
68 |
- task:
|
69 |
type: text-generation
|
@@ -78,7 +78,7 @@ model-index:
|
|
78 |
value: 17.45
|
79 |
name: acc_norm
|
80 |
source:
|
81 |
-
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/
|
82 |
name: Open LLM Leaderboard
|
83 |
- task:
|
84 |
type: text-generation
|
@@ -93,7 +93,7 @@ model-index:
|
|
93 |
value: 20.15
|
94 |
name: acc_norm
|
95 |
source:
|
96 |
-
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/
|
97 |
name: Open LLM Leaderboard
|
98 |
- task:
|
99 |
type: text-generation
|
@@ -110,23 +110,23 @@ model-index:
|
|
110 |
value: 49.05
|
111 |
name: accuracy
|
112 |
source:
|
113 |
-
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/
|
114 |
name: Open LLM Leaderboard
|
115 |
---
|
116 |
|
117 |
<img src="./qwen2-fine-tunes-maziyar-panahi.webp" alt="Qwen2 fine-tune" width="800" style="margin-left:auto; margin-right:auto; display:block"/>
|
118 |
|
119 |
-
# MaziyarPanahi/
|
120 |
|
121 |
This is a fine-tuned version of the `Qwen/Qwen2-72B-Instruct` model. It aims to improve the base model across all benchmarks.
|
122 |
|
123 |
# ⚡ Quantized GGUF
|
124 |
|
125 |
-
All GGUF models are available here: [MaziyarPanahi/
|
126 |
|
127 |
# 🏆 [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard)
|
128 |
|
129 |
-
Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/
|
130 |
|
131 |
| Metric |Value|
|
132 |
|-------------------|----:|
|
@@ -185,7 +185,7 @@ from transformers import pipeline
|
|
185 |
messages = [
|
186 |
{"role": "user", "content": "Who are you?"},
|
187 |
]
|
188 |
-
pipe = pipeline("text-generation", model="MaziyarPanahi/
|
189 |
pipe(messages)
|
190 |
|
191 |
|
@@ -193,8 +193,8 @@ pipe(messages)
|
|
193 |
|
194 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
195 |
|
196 |
-
tokenizer = AutoTokenizer.from_pretrained("MaziyarPanahi/
|
197 |
-
model = AutoModelForCausalLM.from_pretrained("MaziyarPanahi/
|
198 |
```
|
199 |
|
200 |
|
|
|
10 |
- finetune
|
11 |
- chatml
|
12 |
base_model: Qwen/Qwen2-72B-Instruct
|
13 |
+
model_name: MaziyarPanahi/calme-2.1-qwen2-72b
|
14 |
license_name: tongyi-qianwen
|
15 |
license_link: https://huggingface.co/Qwen/Qwen2-72B-Instruct/blob/main/LICENSE
|
16 |
pipeline_tag: text-generation
|
|
|
18 |
model_creator: MaziyarPanahi
|
19 |
quantized_by: MaziyarPanahi
|
20 |
model-index:
|
21 |
+
- name: calme-2.1-qwen2-72b
|
22 |
results:
|
23 |
- task:
|
24 |
type: text-generation
|
|
|
33 |
value: 81.63
|
34 |
name: strict accuracy
|
35 |
source:
|
36 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/calme-2.1-qwen2-72b
|
37 |
name: Open LLM Leaderboard
|
38 |
- task:
|
39 |
type: text-generation
|
|
|
48 |
value: 57.33
|
49 |
name: normalized accuracy
|
50 |
source:
|
51 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/calme-2.1-qwen2-72b
|
52 |
name: Open LLM Leaderboard
|
53 |
- task:
|
54 |
type: text-generation
|
|
|
63 |
value: 36.03
|
64 |
name: exact match
|
65 |
source:
|
66 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/calme-2.1-qwen2-72b
|
67 |
name: Open LLM Leaderboard
|
68 |
- task:
|
69 |
type: text-generation
|
|
|
78 |
value: 17.45
|
79 |
name: acc_norm
|
80 |
source:
|
81 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/calme-2.1-qwen2-72b
|
82 |
name: Open LLM Leaderboard
|
83 |
- task:
|
84 |
type: text-generation
|
|
|
93 |
value: 20.15
|
94 |
name: acc_norm
|
95 |
source:
|
96 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/calme-2.1-qwen2-72b
|
97 |
name: Open LLM Leaderboard
|
98 |
- task:
|
99 |
type: text-generation
|
|
|
110 |
value: 49.05
|
111 |
name: accuracy
|
112 |
source:
|
113 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=MaziyarPanahi/calme-2.1-qwen2-72b
|
114 |
name: Open LLM Leaderboard
|
115 |
---
|
116 |
|
117 |
<img src="./qwen2-fine-tunes-maziyar-panahi.webp" alt="Qwen2 fine-tune" width="800" style="margin-left:auto; margin-right:auto; display:block"/>
|
118 |
|
119 |
+
# MaziyarPanahi/calme-2.1-qwen2-72b
|
120 |
|
121 |
This is a fine-tuned version of the `Qwen/Qwen2-72B-Instruct` model. It aims to improve the base model across all benchmarks.
|
122 |
|
123 |
# ⚡ Quantized GGUF
|
124 |
|
125 |
+
All GGUF models are available here: [MaziyarPanahi/calme-2.1-qwen2-72b-GGUF](https://huggingface.co/MaziyarPanahi/calme-2.1-qwen2-72b-GGUF)
|
126 |
|
127 |
# 🏆 [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard)
|
128 |
|
129 |
+
Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_MaziyarPanahi__calme-2.1-qwen2-72b)
|
130 |
|
131 |
| Metric |Value|
|
132 |
|-------------------|----:|
|
|
|
185 |
messages = [
|
186 |
{"role": "user", "content": "Who are you?"},
|
187 |
]
|
188 |
+
pipe = pipeline("text-generation", model="MaziyarPanahi/calme-2.1-qwen2-72b")
|
189 |
pipe(messages)
|
190 |
|
191 |
|
|
|
193 |
|
194 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
195 |
|
196 |
+
tokenizer = AutoTokenizer.from_pretrained("MaziyarPanahi/calme-2.1-qwen2-72b")
|
197 |
+
model = AutoModelForCausalLM.from_pretrained("MaziyarPanahi/calme-2.1-qwen2-72b")
|
198 |
```
|
199 |
|
200 |
|