Spaces: Running on Inf2
feat(hchat): move Llama 3.3 70B as the default model
Browse files
- chart/env/prod.yaml +21 -21
chart/env/prod.yaml
CHANGED
|
@@ -45,19 +45,20 @@ envVars:
|
|
| 45 |
MODELS: >
|
| 46 |
[
|
| 47 |
{
|
| 48 |
-
"name": "
|
| 49 |
-
"
|
| 50 |
-
"
|
| 51 |
-
"
|
| 52 |
-
"
|
| 53 |
-
"
|
|
|
|
|
|
|
| 54 |
"parameters": {
|
| 55 |
-
"stop": ["<|endoftext|>", "<|
|
| 56 |
"temperature": 0.6,
|
| 57 |
-
"
|
| 58 |
-
"
|
| 59 |
},
|
| 60 |
-
"tools": true,
|
| 61 |
"promptExamples": [
|
| 62 |
{
|
| 63 |
"title": "Write an email from bullet list",
|
|
@@ -74,20 +75,19 @@ envVars:
|
|
| 74 |
]
|
| 75 |
},
|
| 76 |
{
|
| 77 |
-
"name": "
|
| 78 |
-
"
|
| 79 |
-
"
|
| 80 |
-
"
|
| 81 |
-
"
|
| 82 |
-
"
|
| 83 |
-
"tools": true,
|
| 84 |
-
"preprompt": "",
|
| 85 |
"parameters": {
|
| 86 |
-
"stop": ["<|endoftext|>", "<|
|
| 87 |
"temperature": 0.6,
|
| 88 |
-
"
|
| 89 |
-
"
|
| 90 |
},
|
|
|
|
| 91 |
"promptExamples": [
|
| 92 |
{
|
| 93 |
"title": "Write an email from bullet list",
|
|
|
|
| 45 |
MODELS: >
|
| 46 |
[
|
| 47 |
{
|
| 48 |
+
"name": "meta-llama/Llama-3.3-70B-Instruct",
|
| 49 |
+
"id": "meta-llama/Llama-3.3-70B-Instruct",
|
| 50 |
+
"description": "Ideal for everyday use. A fast and extremely capable model matching closed source models' capabilities. Now with the latest Llama 3.3 weights!",
|
| 51 |
+
"modelUrl": "https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct",
|
| 52 |
+
"websiteUrl": "https://llama.meta.com/",
|
| 53 |
+
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",
|
| 54 |
+
"tools": true,
|
| 55 |
+
"preprompt": "",
|
| 56 |
"parameters": {
|
| 57 |
+
"stop": ["<|endoftext|>", "<|eot_id|>"],
|
| 58 |
"temperature": 0.6,
|
| 59 |
+
"max_new_tokens": 1024,
|
| 60 |
+
"truncate": 7167
|
| 61 |
},
|
|
|
|
| 62 |
"promptExamples": [
|
| 63 |
{
|
| 64 |
"title": "Write an email from bullet list",
|
|
|
|
| 75 |
]
|
| 76 |
},
|
| 77 |
{
|
| 78 |
+
"name": "Qwen/Qwen2.5-72B-Instruct",
|
| 79 |
+
"description": "The latest Qwen open model with improved role-playing, long text generation and structured data understanding.",
|
| 80 |
+
"modelUrl": "https://huggingface.co/Qwen/Qwen2.5-72B-Instruct",
|
| 81 |
+
"websiteUrl": "https://qwenlm.github.io/blog/qwen2.5/",
|
| 82 |
+
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
|
| 83 |
+
"preprompt": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant.",
|
|
|
|
|
|
|
| 84 |
"parameters": {
|
| 85 |
+
"stop": ["<|endoftext|>", "<|im_end|>"],
|
| 86 |
"temperature": 0.6,
|
| 87 |
+
"truncate": 28672,
|
| 88 |
+
"max_new_tokens": 3072
|
| 89 |
},
|
| 90 |
+
"tools": true,
|
| 91 |
"promptExamples": [
|
| 92 |
{
|
| 93 |
"title": "Write an email from bullet list",
|