van-qa committed on
Commit
9f1234d
·
verified ·
1 Parent(s): c3e8766

Update model.yml

Browse files
Files changed (1) hide show
  1. model.yml +2 -17
model.yml CHANGED
@@ -3,22 +3,7 @@ model: nomic-embed-text-v1:Q8_0
3
  version: 1
4
  model_type: 'embedding' # 'embedding' | 'llm'
5
 
6
- # Results Preferences
7
- stop:
8
- - '[SEP]'
9
- top_p: 0.7
10
- temperature: 0.7
11
- frequency_penalty: 0.7
12
- presence_penalty: 0.7
13
- max_tokens: 4098 # Infer from base config.json -> max_position_embeddings
14
- stream: true # true | false
15
-
16
  # Engine / Model Settings
17
  ngl: 100 # Infer from base config.json -> num_attention_heads
18
- ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
19
- engine: cortex.llamacpp
20
- prompt_template: |-
21
- [INST] <<SYS>>
22
- {system_message}
23
- <</SYS>>
24
- {prompt}[/INST]
 
3
  version: 1
4
  model_type: 'embedding' # 'embedding' | 'llm'
5
 
 
 
 
 
 
 
 
 
 
 
6
  # Engine / Model Settings
7
  ngl: 100 # Infer from base config.json -> num_attention_heads
8
+ ctx_len: 8192 # Infer from base config.json -> max_position_embeddings
9
+ engine: cortex.llamacpp