johnbridges committed on
Commit
4085ccc
·
1 Parent(s): c89e475

Sync Dockerfile/secrets setup

Browse files
Files changed (2) hide show
  1. Dockerfile +1 -1
  2. appsettings.json +5 -5
Dockerfile CHANGED
@@ -33,7 +33,7 @@ WORKDIR /home/user
33
  RUN mkdir -p /home/user/code/models && \
34
  mkdir -p /home/user/code/app/wwwroot && \
35
  cd /home/user/code/models && \
36
- wget -q https://huggingface.co/Mungert/Qwen3-4B-Instruct-2507-GGUF/resolve/main/Qwen3-4B-Instruct-2507-q8_0.gguf
37
 
38
 
39
  # Clone and build OpenBLAS as the non-root user
 
33
  RUN mkdir -p /home/user/code/models && \
34
  mkdir -p /home/user/code/app/wwwroot && \
35
  cd /home/user/code/models && \
36
+ wget -q https://huggingface.co/Mungert/Qwen3.5-2B-GGUF/resolve/main/Qwen3.5-2B-q6_k_m.gguf
37
 
38
 
39
  # Clone and build OpenBLAS as the non-root user
appsettings.json CHANGED
@@ -25,11 +25,11 @@
25
  "LlmNoInitMessage": true,
26
  "ServiceAuthKey": ".env",
27
  "LlmModelPath": "/home/user/code/models/",
28
- "LlmModelFileName": "Qwen3-4B-Instruct-2507-q8_0.gguf",
29
- "LlmContextFileName": "context-qwen-3.gguf",
30
- "LlmSystemPrompt": "system_prompt_qwen_3_run",
31
  "LlmPromptMode": " -if -sp -no-cnv --simple-io ",
32
- "LlmVersion": "qwen_3",
33
  "LlmCtxSize": 12000,
34
  "LlmOpenAICtxSize": 32000,
35
  "LlmCtxRatio": 6,
@@ -65,7 +65,7 @@
65
  "Enabled": true,
66
  "Type": "Http",
67
  "BaseUrl": "https://cachehttp.readyforquantum.com/api",
68
- "ApiKey": ".env",
69
  "TimeoutSeconds": 600,
70
  "RetryAttempts": 3
71
  }
 
25
  "LlmNoInitMessage": true,
26
  "ServiceAuthKey": ".env",
27
  "LlmModelPath": "/home/user/code/models/",
28
+ "LlmModelFileName": "Qwen3.5-2B-q6_k_m.gguf",
29
+ "LlmContextFileName": "context-qwen-3_5.gguf",
30
+ "LlmSystemPrompt": "system_prompt_qwen_3_5_run",
31
  "LlmPromptMode": " -if -sp -no-cnv --simple-io ",
32
+ "LlmVersion": "qwen_3.5",
33
  "LlmCtxSize": 12000,
34
  "LlmOpenAICtxSize": 32000,
35
  "LlmCtxRatio": 6,
 
65
  "Enabled": true,
66
  "Type": "Http",
67
  "BaseUrl": "https://cachehttp.readyforquantum.com/api",
68
+ "API_KEY": ".env",
69
  "TimeoutSeconds": 600,
70
  "RetryAttempts": 3
71
  }