Commit ·
4085ccc
1
Parent(s): c89e475
Sync Dockerfile/secrets setup
Browse files
- Dockerfile +1 -1
- appsettings.json +5 -5
Dockerfile
CHANGED
|
@@ -33,7 +33,7 @@ WORKDIR /home/user
|
|
| 33 |
RUN mkdir -p /home/user/code/models && \
|
| 34 |
mkdir -p /home/user/code/app/wwwroot && \
|
| 35 |
cd /home/user/code/models && \
|
| 36 |
-
wget -q https://huggingface.co/Mungert/Qwen3-
|
| 37 |
|
| 38 |
|
| 39 |
# Clone and build OpenBLAS as the non-root user
|
|
|
|
| 33 |
RUN mkdir -p /home/user/code/models && \
|
| 34 |
mkdir -p /home/user/code/app/wwwroot && \
|
| 35 |
cd /home/user/code/models && \
|
| 36 |
+
wget -q https://huggingface.co/Mungert/Qwen3.5-2B-GGUF/resolve/main/Qwen3.5-2B-q6_k_m.gguf
|
| 37 |
|
| 38 |
|
| 39 |
# Clone and build OpenBLAS as the non-root user
|
appsettings.json
CHANGED
|
@@ -25,11 +25,11 @@
|
|
| 25 |
"LlmNoInitMessage": true,
|
| 26 |
"ServiceAuthKey": ".env",
|
| 27 |
"LlmModelPath": "/home/user/code/models/",
|
| 28 |
-
"LlmModelFileName": "Qwen3-
|
| 29 |
-
"LlmContextFileName": "context-qwen-
|
| 30 |
-
"LlmSystemPrompt": "
|
| 31 |
"LlmPromptMode": " -if -sp -no-cnv --simple-io ",
|
| 32 |
-
"LlmVersion": "qwen_3",
|
| 33 |
"LlmCtxSize": 12000,
|
| 34 |
"LlmOpenAICtxSize": 32000,
|
| 35 |
"LlmCtxRatio": 6,
|
|
@@ -65,7 +65,7 @@
|
|
| 65 |
"Enabled": true,
|
| 66 |
"Type": "Http",
|
| 67 |
"BaseUrl": "https://cachehttp.readyforquantum.com/api",
|
| 68 |
-
"
|
| 69 |
"TimeoutSeconds": 600,
|
| 70 |
"RetryAttempts": 3
|
| 71 |
}
|
|
|
|
| 25 |
"LlmNoInitMessage": true,
|
| 26 |
"ServiceAuthKey": ".env",
|
| 27 |
"LlmModelPath": "/home/user/code/models/",
|
| 28 |
+
"LlmModelFileName": "Qwen3.5-2B-q6_k_m.gguf",
|
| 29 |
+
"LlmContextFileName": "context-qwen-3_5.gguf",
|
| 30 |
+
"LlmSystemPrompt": "system_prompt_qwen_3_5_run",
|
| 31 |
"LlmPromptMode": " -if -sp -no-cnv --simple-io ",
|
| 32 |
+
"LlmVersion": "qwen_3.5",
|
| 33 |
"LlmCtxSize": 12000,
|
| 34 |
"LlmOpenAICtxSize": 32000,
|
| 35 |
"LlmCtxRatio": 6,
|
|
|
|
| 65 |
"Enabled": true,
|
| 66 |
"Type": "Http",
|
| 67 |
"BaseUrl": "https://cachehttp.readyforquantum.com/api",
|
| 68 |
+
"API_KEY": ".env",
|
| 69 |
"TimeoutSeconds": 600,
|
| 70 |
"RetryAttempts": 3
|
| 71 |
}
|