Spaces:
Sleeping
Sleeping
feat(huggingchat): Model update 24/09/2024 (#1485)
Browse files- chart/env/prod.yaml +53 -71
chart/env/prod.yaml
CHANGED
|
@@ -53,9 +53,8 @@ envVars:
|
|
| 53 |
"tools": true,
|
| 54 |
"preprompt": "",
|
| 55 |
"parameters": {
|
| 56 |
-
"temperature": 0.6,
|
| 57 |
-
"top_p": 0.9,
|
| 58 |
"stop": ["<|endoftext|>", "<|eot_id|>"],
|
|
|
|
| 59 |
"max_new_tokens": 1024,
|
| 60 |
"truncate": 7167
|
| 61 |
},
|
|
@@ -115,42 +114,10 @@ envVars:
|
|
| 115 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
|
| 116 |
"preprompt": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant.",
|
| 117 |
"parameters": {
|
| 118 |
-
"temperature": 0.6,
|
| 119 |
"stop": ["<|endoftext|>", "<|im_end|>"],
|
| 120 |
-
"truncate": 28672,
|
| 121 |
-
"max_new_tokens": 3072,
|
| 122 |
-
},
|
| 123 |
-
"promptExamples": [
|
| 124 |
-
{
|
| 125 |
-
"title": "Write an email from bullet list",
|
| 126 |
-
"prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
|
| 127 |
-
},
|
| 128 |
-
{
|
| 129 |
-
"title": "Code a snake game",
|
| 130 |
-
"prompt": "Code a basic snake game in python, give explanations for each step."
|
| 131 |
-
},
|
| 132 |
-
{
|
| 133 |
-
"title": "Assist in a task",
|
| 134 |
-
"prompt": "How do I make a delicious lemon cheesecake?"
|
| 135 |
-
}
|
| 136 |
-
]
|
| 137 |
-
},
|
| 138 |
-
{
|
| 139 |
-
"name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
|
| 140 |
-
"description": "A high-quality sparse mixture of experts model with open weights.",
|
| 141 |
-
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/mistral-logo.png",
|
| 142 |
-
"websiteUrl": "https://mistral.ai/news/mixtral-of-experts/",
|
| 143 |
-
"modelUrl": "https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1",
|
| 144 |
-
"tokenizer": "mistralai/Mixtral-8x7B-Instruct-v0.1",
|
| 145 |
-
"preprompt": "",
|
| 146 |
-
"parameters": {
|
| 147 |
"temperature": 0.6,
|
| 148 |
-
"
|
| 149 |
-
"
|
| 150 |
-
"top_k": 50,
|
| 151 |
-
"truncate": 24576,
|
| 152 |
-
"max_new_tokens": 8192,
|
| 153 |
-
"stop": ["</s>"]
|
| 154 |
},
|
| 155 |
"promptExamples": [
|
| 156 |
{
|
|
@@ -168,12 +135,12 @@ envVars:
|
|
| 168 |
]
|
| 169 |
},
|
| 170 |
{
|
| 171 |
-
"name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
|
| 172 |
-
"description": "Nous
|
| 173 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/nous-logo.png",
|
| 174 |
"websiteUrl": "https://nousresearch.com/",
|
| 175 |
-
"modelUrl": "https://huggingface.co/NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
|
| 176 |
-
"tokenizer": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
|
| 177 |
"promptExamples": [
|
| 178 |
{
|
| 179 |
"title": "Write an email from bullet list",
|
|
@@ -189,32 +156,26 @@ envVars:
|
|
| 189 |
}
|
| 190 |
],
|
| 191 |
"parameters": {
|
| 192 |
-
"
|
| 193 |
-
"
|
| 194 |
-
"
|
| 195 |
-
"
|
| 196 |
-
"truncate": 24576,
|
| 197 |
-
"max_new_tokens": 2048,
|
| 198 |
-
"stop": ["<|im_end|>"]
|
| 199 |
}
|
| 200 |
},
|
| 201 |
{
|
| 202 |
-
"name": "mistralai/Mistral-7B-Instruct-v0.3",
|
| 203 |
-
"displayName": "mistralai/Mistral-7B-Instruct-v0.3",
|
|
|
|
| 204 |
"description": "A small model with good capabilities in language understanding and commonsense reasoning.",
|
| 205 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/mistral-logo.png",
|
| 206 |
-
"websiteUrl": "https://mistral.ai/news/
|
| 207 |
-
"modelUrl": "https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.3",
|
| 208 |
-
"tokenizer": "mistralai/Mistral-7B-Instruct-v0.3",
|
| 209 |
"preprompt": "",
|
| 210 |
"parameters": {
|
| 211 |
-
"
|
| 212 |
-
"
|
| 213 |
-
"
|
| 214 |
-
"
|
| 215 |
-
"truncate": 3072,
|
| 216 |
-
"max_new_tokens": 1024,
|
| 217 |
-
"stop": ["</s>"]
|
| 218 |
},
|
| 219 |
"promptExamples": [
|
| 220 |
{
|
|
@@ -232,18 +193,18 @@ envVars:
|
|
| 232 |
]
|
| 233 |
},
|
| 234 |
{
|
| 235 |
-
"name": "microsoft/Phi-3-mini-4k-instruct",
|
| 236 |
-
"tokenizer": "microsoft/Phi-3-mini-4k-instruct",
|
| 237 |
"description": "One of the best small models (3.8B parameters), super fast for simple tasks.",
|
| 238 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/microsoft-logo.png",
|
| 239 |
-
"modelUrl": "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct",
|
| 240 |
-
"websiteUrl": "https://
|
| 241 |
"preprompt": "",
|
| 242 |
"parameters": {
|
| 243 |
"stop": ["<|end|>", "<|endoftext|>", "<|assistant|>"],
|
| 244 |
-
"temperature": 0.
|
| 245 |
-
"
|
| 246 |
-
"
|
| 247 |
},
|
| 248 |
"promptExamples": [
|
| 249 |
{
|
|
@@ -268,7 +229,6 @@ envVars:
|
|
| 268 |
},
|
| 269 |
"parameters": {
|
| 270 |
"temperature": 0.6,
|
| 271 |
-
"top_p": 0.9,
|
| 272 |
"stop": ["<|endoftext|>", "<|eot_id|>"]
|
| 273 |
},
|
| 274 |
"unlisted": true
|
|
@@ -290,10 +250,32 @@ envVars:
|
|
| 290 |
{ "name": "meta-llama/Llama-2-70b-chat-hf" },
|
| 291 |
{ "name": "codellama/CodeLlama-70b-Instruct-hf" },
|
| 292 |
{ "name": "openchat/openchat-3.5-0106" },
|
| 293 |
-
{ "name": "meta-llama/Meta-Llama-3-70B-Instruct"},
|
| 294 |
-
{ "name": "meta-llama/Meta-Llama-3.1-405B-Instruct-FP8"},
|
| 295 |
-
{
|
| 296 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 297 |
]
|
| 298 |
PUBLIC_ORIGIN: "https://huggingface.co"
|
| 299 |
PUBLIC_SHARE_PREFIX: "https://hf.co/chat"
|
|
|
|
| 53 |
"tools": true,
|
| 54 |
"preprompt": "",
|
| 55 |
"parameters": {
|
|
|
|
|
|
|
| 56 |
"stop": ["<|endoftext|>", "<|eot_id|>"],
|
| 57 |
+
"temperature": 0.6,
|
| 58 |
"max_new_tokens": 1024,
|
| 59 |
"truncate": 7167
|
| 60 |
},
|
|
|
|
| 114 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
|
| 115 |
"preprompt": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant.",
|
| 116 |
"parameters": {
|
|
|
|
| 117 |
"stop": ["<|endoftext|>", "<|im_end|>"],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 118 |
"temperature": 0.6,
|
| 119 |
+
"truncate": 28672,
|
| 120 |
+
"max_new_tokens": 3072
|
|
|
|
|
|
|
|
|
|
|
|
|
| 121 |
},
|
| 122 |
"promptExamples": [
|
| 123 |
{
|
|
|
|
| 135 |
]
|
| 136 |
},
|
| 137 |
{
|
| 138 |
+
"name": "NousResearch/Hermes-3-Llama-3.1-8B",
|
| 139 |
+
"description": "Nous Research's latest Hermes 3 release in 8B size. Follows instruction closely.",
|
| 140 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/nous-logo.png",
|
| 141 |
"websiteUrl": "https://nousresearch.com/",
|
| 142 |
+
"modelUrl": "https://huggingface.co/NousResearch/Hermes-3-Llama-3.1-8B",
|
| 143 |
+
"tokenizer": "NousResearch/Hermes-3-Llama-3.1-8B",
|
| 144 |
"promptExamples": [
|
| 145 |
{
|
| 146 |
"title": "Write an email from bullet list",
|
|
|
|
| 156 |
}
|
| 157 |
],
|
| 158 |
"parameters": {
|
| 159 |
+
"stop": ["<|im_end|>"],
|
| 160 |
+
"temperature": 0.6,
|
| 161 |
+
"truncate": 14336,
|
| 162 |
+
"max_new_tokens": 1536
|
|
|
|
|
|
|
|
|
|
| 163 |
}
|
| 164 |
},
|
| 165 |
{
|
| 166 |
+
"name": "mistralai/Mistral-Nemo-Instruct-2407",
|
| 167 |
+
"tokenizer": "mistralai/Mistral-Nemo-Instruct-2407",
|
| 168 |
+
"displayName": "mistralai/Mistral-Nemo-Instruct-2407",
|
| 169 |
"description": "A small model with good capabilities in language understanding and commonsense reasoning.",
|
| 170 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/mistral-logo.png",
|
| 171 |
+
"websiteUrl": "https://mistral.ai/news/mistral-nemo/",
|
| 172 |
+
"modelUrl": "https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407",
|
|
|
|
| 173 |
"preprompt": "",
|
| 174 |
"parameters": {
|
| 175 |
+
"stop": ["</s>"],
|
| 176 |
+
"temperature": 0.6,
|
| 177 |
+
"truncate": 14336,
|
| 178 |
+
"max_new_tokens": 1536
|
|
|
|
|
|
|
|
|
|
| 179 |
},
|
| 180 |
"promptExamples": [
|
| 181 |
{
|
|
|
|
| 193 |
]
|
| 194 |
},
|
| 195 |
{
|
| 196 |
+
"name": "microsoft/Phi-3.5-mini-instruct",
|
| 197 |
+
"tokenizer": "microsoft/Phi-3.5-mini-instruct",
|
| 198 |
"description": "One of the best small models (3.8B parameters), super fast for simple tasks.",
|
| 199 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/microsoft-logo.png",
|
| 200 |
+
"modelUrl": "https://huggingface.co/microsoft/Phi-3.5-mini-instruct",
|
| 201 |
+
"websiteUrl": "https://techcommunity.microsoft.com/t5/ai-azure-ai-services-blog/discover-the-new-multi-lingual-high-quality-phi-3-5-slms/ba-p/4225280/",
|
| 202 |
"preprompt": "",
|
| 203 |
"parameters": {
|
| 204 |
"stop": ["<|end|>", "<|endoftext|>", "<|assistant|>"],
|
| 205 |
+
"temperature": 0.6,
|
| 206 |
+
"truncate": 28672,
|
| 207 |
+
"max_new_tokens": 3072
|
| 208 |
},
|
| 209 |
"promptExamples": [
|
| 210 |
{
|
|
|
|
| 229 |
},
|
| 230 |
"parameters": {
|
| 231 |
"temperature": 0.6,
|
|
|
|
| 232 |
"stop": ["<|endoftext|>", "<|eot_id|>"]
|
| 233 |
},
|
| 234 |
"unlisted": true
|
|
|
|
| 250 |
{ "name": "meta-llama/Llama-2-70b-chat-hf" },
|
| 251 |
{ "name": "codellama/CodeLlama-70b-Instruct-hf" },
|
| 252 |
{ "name": "openchat/openchat-3.5-0106" },
|
| 253 |
+
{ "name": "meta-llama/Meta-Llama-3-70B-Instruct" },
|
| 254 |
+
{ "name": "meta-llama/Meta-Llama-3.1-405B-Instruct-FP8" },
|
| 255 |
+
{
|
| 256 |
+
"name": "CohereForAI/c4ai-command-r-plus",
|
| 257 |
+
"transferTo": "CohereForAI/c4ai-command-r-plus-08-2024"
|
| 258 |
+
},
|
| 259 |
+
{
|
| 260 |
+
"name": "01-ai/Yi-1.5-34B-Chat",
|
| 261 |
+
"transferTo": "CohereForAI/c4ai-command-r-plus-08-2024"
|
| 262 |
+
},
|
| 263 |
+
{
|
| 264 |
+
"name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
|
| 265 |
+
"transferTo": "mistralai/Mistral-Nemo-Instruct-2407"
|
| 266 |
+
},
|
| 267 |
+
{
|
| 268 |
+
"name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
|
| 269 |
+
"transferTo": "NousResearch/Hermes-3-Llama-3.1-8B"
|
| 270 |
+
},
|
| 271 |
+
{
|
| 272 |
+
"name": "mistralai/Mistral-7B-Instruct-v0.3",
|
| 273 |
+
"transferTo": "mistralai/Mistral-Nemo-Instruct-2407"
|
| 274 |
+
},
|
| 275 |
+
{
|
| 276 |
+
"name": "microsoft/Phi-3-mini-4k-instruct",
|
| 277 |
+
"transferTo": "microsoft/Phi-3.5-mini-instruct"
|
| 278 |
+
}
|
| 279 |
]
|
| 280 |
PUBLIC_ORIGIN: "https://huggingface.co"
|
| 281 |
PUBLIC_SHARE_PREFIX: "https://hf.co/chat"
|