Upload model.yml with huggingface_hub
Browse files
model.yml
ADDED
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# BEGIN GENERAL GGUF METADATA
|
2 |
+
id: amd-olmo
|
3 |
+
model: amd-olmo
|
4 |
+
name: amd-olmo
|
5 |
+
version: 1
|
6 |
+
# END GENERAL GGUF METADATA
|
7 |
+
|
8 |
+
# BEGIN INFERENCE PARAMETERS
|
9 |
+
# BEGIN REQUIRED
|
10 |
+
stop:
|
11 |
+
- <|im_end|>
|
12 |
+
# END REQUIRED
|
13 |
+
|
14 |
+
# BEGIN OPTIONAL
|
15 |
+
stream: true
|
16 |
+
top_p: 0.9
|
17 |
+
temperature: 0.7
|
18 |
+
frequency_penalty: 0
|
19 |
+
presence_penalty: 0
|
20 |
+
max_tokens: 4096
|
21 |
+
seed: -1
|
22 |
+
dynatemp_range: 0
|
23 |
+
dynatemp_exponent: 1
|
24 |
+
top_k: 40
|
25 |
+
min_p: 0.05
|
26 |
+
tfs_z: 1
|
27 |
+
typ_p: 1
|
28 |
+
repeat_last_n: 64
|
29 |
+
repeat_penalty: 1
|
30 |
+
mirostat: false
|
31 |
+
mirostat_tau: 5
|
32 |
+
mirostat_eta: 0.100000001
|
33 |
+
penalize_nl: false
|
34 |
+
ignore_eos: false
|
35 |
+
n_probs: 0
|
36 |
+
min_keep: 0
|
37 |
+
# END OPTIONAL
|
38 |
+
# END INFERENCE PARAMETERS
|
39 |
+
|
40 |
+
# BEGIN MODEL LOAD PARAMETERS
|
41 |
+
# BEGIN REQUIRED
|
42 |
+
engine: llama-cpp
|
43 |
+
prompt_template: <|im_start|>system\n{system_message}<|im_end|>\n<|im_start|>user\n{prompt}<|im_end|>\n<|im_start|>assistant\n
|
44 |
+
ctx_len: 4096
|
45 |
+
ngl: 34
|
46 |
+
# END REQUIRED
|
47 |
+
# END MODEL LOAD PARAMETERS
|