Update model.yml
Browse files
model.yml
CHANGED
@@ -3,22 +3,7 @@ model: nomic-embed-text-v1:Q8_0
|
|
3 |
version: 1
|
4 |
model_type: 'embedding' # 'embedding' | 'llm'
|
5 |
|
6 |
-
# Results Preferences
|
7 |
-
stop:
|
8 |
-
- '[SEP]'
|
9 |
-
top_p: 0.7
|
10 |
-
temperature: 0.7
|
11 |
-
frequency_penalty: 0.7
|
12 |
-
presence_penalty: 0.7
|
13 |
-
max_tokens: 4098 # Infer from base config.json -> max_position_embeddings
|
14 |
-
stream: true # true | false
|
15 |
-
|
16 |
# Engine / Model Settings
|
17 |
ngl: 100 # Infer from base config.json -> num_attention_heads
|
18 |
-
ctx_len:
|
19 |
-
engine: cortex.llamacpp
|
20 |
-
prompt_template: |-
|
21 |
-
[INST] <<SYS>>
|
22 |
-
{system_message}
|
23 |
-
<</SYS>>
|
24 |
-
{prompt}[/INST]
|
|
|
3 |
version: 1
|
4 |
model_type: 'embedding' # 'embedding' | 'llm'
|
5 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
# Engine / Model Settings
|
7 |
ngl: 100 # Infer from base config.json -> num_attention_heads
|
8 |
+
ctx_len: 8192 # Infer from base config.json -> max_position_embeddings
|
9 |
+
engine: cortex.llamacpp
|
|
|
|
|
|
|
|
|
|