Update README.md
Browse files
README.md
CHANGED
@@ -4,3 +4,23 @@ base_model: Felladrin/TinyMistral-248M-Chat-v2
|
|
4 |
---
|
5 |
|
6 |
GGUF version of [Felladrin/TinyMistral-248M-Chat-v2](https://huggingface.co/Felladrin/TinyMistral-248M-Chat-v2).
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4 |
---
|
5 |
|
6 |
GGUF version of [Felladrin/TinyMistral-248M-Chat-v2](https://huggingface.co/Felladrin/TinyMistral-248M-Chat-v2).
|
7 |
+
|
8 |
+
## Usage with llama.cpp
|
9 |
+
|
10 |
+
```bash
|
11 |
+
brew install ggerganov/ggerganov/llama.cpp
|
12 |
+
```
|
13 |
+
|
14 |
+
```bash
|
15 |
+
llama-cli \
|
16 |
+
--hf-repo Felladrin/gguf-TinyMistral-248M-Chat-v2 \
|
17 |
+
--model TinyMistral-248M-Chat-v2.Q8_0.gguf \
|
18 |
+
-p "<|im_start|>system\nYou are a helpful assistant who answers user's questions with details and curiosity.<|im_end|>\n<|im_start|>user\nWhat are some potential applications for quantum computing?<|im_end|>\n<|im_start|>assistant\n" \
|
19 |
+
-e \
|
20 |
+
--dynatemp-range "0.1-0.35" \
|
21 |
+
--min-p 0.05 \
|
22 |
+
--repeat-penalty 1.1 \
|
23 |
+
-c 2048 \
|
24 |
+
-n 250 \
|
25 |
+
-r "<|im_end|>"
|
26 |
+
```
|