Cartinoe5930 committed on
Commit
cf97a0a
1 Parent(s): 428a5ee

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - merge
4
+ - mergekit
5
+ - lazymergekit
6
+ - lmsys/vicuna-13b-v1.5
7
+ - OpenAssistant/llama2-13b-orca-8k-3319
8
+ base_model:
9
+ - lmsys/vicuna-13b-v1.5
10
+ - OpenAssistant/llama2-13b-orca-8k-3319
11
+ ---
12
+
13
+ # vicuna-orac
14
+
15
+ vicuna-orac is a merge of the following models using [LazyMergekit](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb?usp=sharing):
16
+ * [lmsys/vicuna-13b-v1.5](https://huggingface.co/lmsys/vicuna-13b-v1.5)
17
+ * [OpenAssistant/llama2-13b-orca-8k-3319](https://huggingface.co/OpenAssistant/llama2-13b-orca-8k-3319)
18
+
19
+ ## 🧩 Configuration
20
+
21
+ ```yaml
22
+ models:
23
+ - model: lmsys/vicuna-13b-v1.5
24
+ parameters:
25
+ weight: 0.5
26
+ - model: OpenAssistant/llama2-13b-orca-8k-3319
27
+ parameters:
28
+ weight: 0.5
29
+ merge_method: linear
30
+ dtype: bfloat16
31
+ ```
32
+
33
+ ## 💻 Usage
34
+
35
+ ```python
36
+ !pip install -qU transformers accelerate
37
+
38
+ from transformers import AutoTokenizer
39
+ import transformers
40
+ import torch
41
+
42
+ model = "Cartinoe5930/vicuna-orac"
43
+ messages = [{"role": "user", "content": "What is a large language model?"}]
44
+
45
+ tokenizer = AutoTokenizer.from_pretrained(model)
46
+ prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
47
+ pipeline = transformers.pipeline(
48
+ "text-generation",
49
+ model=model,
50
+ torch_dtype=torch.float16,
51
+ device_map="auto",
52
+ )
53
+
54
+ outputs = pipeline(prompt, max_new_tokens=256, do_sample=True, temperature=0.7, top_k=50, top_p=0.95)
55
+ print(outputs[0]["generated_text"])
56
+ ```
added_tokens.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<pad>": 32000,
3
+ "<|assistant|>": 32001,
4
+ "<|prefix_begin|>": 32004,
5
+ "<|prefix_end|>": 32002,
6
+ "<|prompter|>": 32005,
7
+ "<|system|>": 32003
8
+ }
config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "OpenAssistant/llama2-13b-orca-8k-3319",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 5120,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 13824,
14
+ "max_length": 8192,
15
+ "max_position_embeddings": 8192,
16
+ "mlp_bias": false,
17
+ "model_type": "llama",
18
+ "num_attention_heads": 40,
19
+ "num_hidden_layers": 40,
20
+ "num_key_value_heads": 40,
21
+ "pad_token_id": 0,
22
+ "pretraining_tp": 1,
23
+ "rms_norm_eps": 1e-05,
24
+ "rope_scaling": {
25
+ "factor": 2.0,
26
+ "type": "linear"
27
+ },
28
+ "rope_theta": 10000.0,
29
+ "tie_word_embeddings": false,
30
+ "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.41.1",
32
+ "use_cache": true,
33
+ "vocab_size": 32016
34
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ models:
3
+ - model: lmsys/vicuna-13b-v1.5
4
+ parameters:
5
+ weight: 0.5
6
+ - model: OpenAssistant/llama2-13b-orca-8k-3319
7
+ parameters:
8
+ weight: 0.5
9
+ merge_method: linear
10
+ dtype: bfloat16
model-00001-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed43984cbb4e33724d87cef9dde299f5329821c72a1ebd3df055e7859d94e855
3
+ size 938486328
model-00002-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c02e045dcf7df4317e79e008f9d752c625978eb7eb6376f201919dd93b3a220
3
+ size 985704256
model-00003-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed754486a5ab7852dcfca773d71d5409d31cf2fc28ee1b69c6202316ef5baa15
3
+ size 917525776
model-00004-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d68a1688a4ca0a3184d93ff3f80e28c7f1816584539f6141fd753934a1ab911
3
+ size 985704272
model-00005-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ee38af3e608217e920aed47be300a9526c7df3798a6426567ce4bba0fc09936
3
+ size 917525776
model-00006-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc38ac265aff41f3fb4b6d368195b8873bcf4e06ad0c7c0fd5b3d54a85658e56
3
+ size 985704272
model-00007-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d293eb9fe2b4b309e53f3662d6840cd89204e9ede986e52a06a4734a98af1076
3
+ size 917525776
model-00008-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cda4cf2c6fccb4229b995fd488a6c667dafe90a6eb1da666a8c663cd12b1fc0
3
+ size 985704272
model-00009-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7985e486a36c296c6a8cd7b5d8cc159added07e51d41d094bea7c71831e9b2d9
3
+ size 917525776
model-00010-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd9321e5d9b567620607bb7c2d31cc1b7215c26ac9c40ffe7f6576862b75e763
3
+ size 985704264
model-00011-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7832cf8c3fa13bdfa495f49154446eb9acb8759ae3633fdb232e316a4db186db
3
+ size 917525776
model-00012-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8454aea183774b09a71a85288f6282bfa20d8983e08143bcafac151b82e7893a
3
+ size 985704272
model-00013-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6370d7a58598a769dd522c9e3c6561e04bbf0996aeafd92daf3c74db8c806fc6
3
+ size 917525776
model-00014-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f766eea00d6bfd874ee821c6bc37b8d38b5b6da4a80abf0ccd87cbadffce57b
3
+ size 985704272
model-00015-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d112080529655bb824873fff563feb5b9b352633708b07b944e94207ce81e8ca
3
+ size 917525776
model-00016-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d583fd48b193e9249ced603c6a74c12ed1f28ebc08b20927aceb0f7f9f14070
3
+ size 985704272
model-00017-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19b3794436ad73e2bebf287cd6e99c92c1f0e7d14f60a01620eb4a9ebef40760
3
+ size 917525768
model-00018-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:809d3f4783333ad6c085b269353d9d30c89356f2d2f66a041f63308d2e0d32ec
3
+ size 985704272
model-00019-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e344bec9efeaa9b0701d498d89bbebe471196df4786ffff1f8800baa17b74e9f
3
+ size 917525776
model-00020-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0b28b7cd15c73b656a470cbd3fa6a2b1ca4374bfb55c95675844408e84956c
3
+ size 985704272
model-00021-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c54a3aa5ff83ddc463ed319372f4e39b82ea5e219089253659984f8d92d90295
3
+ size 917525776
model-00022-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ebbff4591e59d1f501e5d24ec38ec23f37f12f7033ef8954138a8a9c1024d2d
3
+ size 985704272
model-00023-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:885317d031c88403dc4f9b968705bf623e99f14a0632107823a40037a761b9cf
3
+ size 917525776
model-00024-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b417a7a888ef239a7662bb3244194814184cca7bec8664122675bc2b1fe6e6
3
+ size 985704264
model-00025-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f89022b6503f312876b5be3c9fcb7837eb1b58ff60f79bb1925827ec57833d96
3
+ size 917525768
model-00026-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2eaf32b9cb77663103125207bb06d9a2ef8dbfa83b6356e9612a62ff2af7086
3
+ size 985704256
model-00027-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0267bb0a701705d8f05ecfa5ae0843cdd24f971b25ca50d34015cf79cfdb5098
3
+ size 917525768
model-00028-of-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3790abc4b528c8cb1f550312103e767e617812c0a5a6078bd41d1a370208a69
3
+ size 351294256
model.safetensors.index.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"metadata": {"mergekit_version": "0.0.4.2", "total_size": 26031728640}, "weight_map": {"lm_head.weight": "model-00001-of-00028.safetensors", "model.embed_tokens.weight": "model-00001-of-00028.safetensors", "model.layers.0.input_layernorm.weight": "model-00001-of-00028.safetensors", "model.layers.0.mlp.down_proj.weight": "model-00001-of-00028.safetensors", "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00028.safetensors", "model.layers.0.mlp.up_proj.weight": "model-00002-of-00028.safetensors", "model.layers.0.post_attention_layernorm.weight": "model-00002-of-00028.safetensors", "model.layers.0.self_attn.k_proj.weight": "model-00002-of-00028.safetensors", "model.layers.0.self_attn.o_proj.weight": "model-00002-of-00028.safetensors", "model.layers.0.self_attn.q_proj.weight": "model-00002-of-00028.safetensors", "model.layers.0.self_attn.v_proj.weight": "model-00002-of-00028.safetensors", "model.layers.1.input_layernorm.weight": "model-00002-of-00028.safetensors", "model.layers.1.mlp.down_proj.weight": "model-00002-of-00028.safetensors", "model.layers.1.mlp.gate_proj.weight": "model-00002-of-00028.safetensors", "model.layers.1.mlp.up_proj.weight": "model-00002-of-00028.safetensors", "model.layers.1.post_attention_layernorm.weight": "model-00002-of-00028.safetensors", "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00028.safetensors", "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00028.safetensors", "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00028.safetensors", "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00028.safetensors", "model.layers.10.input_layernorm.weight": "model-00002-of-00028.safetensors", "model.layers.10.mlp.down_proj.weight": "model-00003-of-00028.safetensors", "model.layers.10.mlp.gate_proj.weight": "model-00003-of-00028.safetensors", "model.layers.10.mlp.up_proj.weight": "model-00003-of-00028.safetensors", "model.layers.10.post_attention_layernorm.weight": "model-00003-of-00028.safetensors", 
"model.layers.10.self_attn.k_proj.weight": "model-00003-of-00028.safetensors", "model.layers.10.self_attn.o_proj.weight": "model-00003-of-00028.safetensors", "model.layers.10.self_attn.q_proj.weight": "model-00003-of-00028.safetensors", "model.layers.10.self_attn.v_proj.weight": "model-00003-of-00028.safetensors", "model.layers.11.input_layernorm.weight": "model-00003-of-00028.safetensors", "model.layers.11.mlp.down_proj.weight": "model-00003-of-00028.safetensors", "model.layers.11.mlp.gate_proj.weight": "model-00003-of-00028.safetensors", "model.layers.11.mlp.up_proj.weight": "model-00004-of-00028.safetensors", "model.layers.11.post_attention_layernorm.weight": "model-00004-of-00028.safetensors", "model.layers.11.self_attn.k_proj.weight": "model-00004-of-00028.safetensors", "model.layers.11.self_attn.o_proj.weight": "model-00004-of-00028.safetensors", "model.layers.11.self_attn.q_proj.weight": "model-00004-of-00028.safetensors", "model.layers.11.self_attn.v_proj.weight": "model-00004-of-00028.safetensors", "model.layers.12.input_layernorm.weight": "model-00004-of-00028.safetensors", "model.layers.12.mlp.down_proj.weight": "model-00004-of-00028.safetensors", "model.layers.12.mlp.gate_proj.weight": "model-00004-of-00028.safetensors", "model.layers.12.mlp.up_proj.weight": "model-00004-of-00028.safetensors", "model.layers.12.post_attention_layernorm.weight": "model-00004-of-00028.safetensors", "model.layers.12.self_attn.k_proj.weight": "model-00004-of-00028.safetensors", "model.layers.12.self_attn.o_proj.weight": "model-00004-of-00028.safetensors", "model.layers.12.self_attn.q_proj.weight": "model-00004-of-00028.safetensors", "model.layers.12.self_attn.v_proj.weight": "model-00004-of-00028.safetensors", "model.layers.13.input_layernorm.weight": "model-00004-of-00028.safetensors", "model.layers.13.mlp.down_proj.weight": "model-00005-of-00028.safetensors", "model.layers.13.mlp.gate_proj.weight": "model-00005-of-00028.safetensors", "model.layers.13.mlp.up_proj.weight": 
"model-00005-of-00028.safetensors", "model.layers.13.post_attention_layernorm.weight": "model-00005-of-00028.safetensors", "model.layers.13.self_attn.k_proj.weight": "model-00005-of-00028.safetensors", "model.layers.13.self_attn.o_proj.weight": "model-00005-of-00028.safetensors", "model.layers.13.self_attn.q_proj.weight": "model-00005-of-00028.safetensors", "model.layers.13.self_attn.v_proj.weight": "model-00005-of-00028.safetensors", "model.layers.14.input_layernorm.weight": "model-00005-of-00028.safetensors", "model.layers.14.mlp.down_proj.weight": "model-00005-of-00028.safetensors", "model.layers.14.mlp.gate_proj.weight": "model-00005-of-00028.safetensors", "model.layers.14.mlp.up_proj.weight": "model-00006-of-00028.safetensors", "model.layers.14.post_attention_layernorm.weight": "model-00006-of-00028.safetensors", "model.layers.14.self_attn.k_proj.weight": "model-00006-of-00028.safetensors", "model.layers.14.self_attn.o_proj.weight": "model-00006-of-00028.safetensors", "model.layers.14.self_attn.q_proj.weight": "model-00006-of-00028.safetensors", "model.layers.14.self_attn.v_proj.weight": "model-00006-of-00028.safetensors", "model.layers.15.input_layernorm.weight": "model-00006-of-00028.safetensors", "model.layers.15.mlp.down_proj.weight": "model-00006-of-00028.safetensors", "model.layers.15.mlp.gate_proj.weight": "model-00006-of-00028.safetensors", "model.layers.15.mlp.up_proj.weight": "model-00006-of-00028.safetensors", "model.layers.15.post_attention_layernorm.weight": "model-00006-of-00028.safetensors", "model.layers.15.self_attn.k_proj.weight": "model-00006-of-00028.safetensors", "model.layers.15.self_attn.o_proj.weight": "model-00006-of-00028.safetensors", "model.layers.15.self_attn.q_proj.weight": "model-00006-of-00028.safetensors", "model.layers.15.self_attn.v_proj.weight": "model-00006-of-00028.safetensors", "model.layers.16.input_layernorm.weight": "model-00006-of-00028.safetensors", "model.layers.16.mlp.down_proj.weight": 
"model-00007-of-00028.safetensors", "model.layers.16.mlp.gate_proj.weight": "model-00007-of-00028.safetensors", "model.layers.16.mlp.up_proj.weight": "model-00007-of-00028.safetensors", "model.layers.16.post_attention_layernorm.weight": "model-00007-of-00028.safetensors", "model.layers.16.self_attn.k_proj.weight": "model-00007-of-00028.safetensors", "model.layers.16.self_attn.o_proj.weight": "model-00007-of-00028.safetensors", "model.layers.16.self_attn.q_proj.weight": "model-00007-of-00028.safetensors", "model.layers.16.self_attn.v_proj.weight": "model-00007-of-00028.safetensors", "model.layers.17.input_layernorm.weight": "model-00007-of-00028.safetensors", "model.layers.17.mlp.down_proj.weight": "model-00007-of-00028.safetensors", "model.layers.17.mlp.gate_proj.weight": "model-00007-of-00028.safetensors", "model.layers.17.mlp.up_proj.weight": "model-00008-of-00028.safetensors", "model.layers.17.post_attention_layernorm.weight": "model-00008-of-00028.safetensors", "model.layers.17.self_attn.k_proj.weight": "model-00008-of-00028.safetensors", "model.layers.17.self_attn.o_proj.weight": "model-00008-of-00028.safetensors", "model.layers.17.self_attn.q_proj.weight": "model-00008-of-00028.safetensors", "model.layers.17.self_attn.v_proj.weight": "model-00008-of-00028.safetensors", "model.layers.18.input_layernorm.weight": "model-00008-of-00028.safetensors", "model.layers.18.mlp.down_proj.weight": "model-00008-of-00028.safetensors", "model.layers.18.mlp.gate_proj.weight": "model-00008-of-00028.safetensors", "model.layers.18.mlp.up_proj.weight": "model-00008-of-00028.safetensors", "model.layers.18.post_attention_layernorm.weight": "model-00008-of-00028.safetensors", "model.layers.18.self_attn.k_proj.weight": "model-00008-of-00028.safetensors", "model.layers.18.self_attn.o_proj.weight": "model-00008-of-00028.safetensors", "model.layers.18.self_attn.q_proj.weight": "model-00008-of-00028.safetensors", "model.layers.18.self_attn.v_proj.weight": 
"model-00008-of-00028.safetensors", "model.layers.19.input_layernorm.weight": "model-00008-of-00028.safetensors", "model.layers.19.mlp.down_proj.weight": "model-00009-of-00028.safetensors", "model.layers.19.mlp.gate_proj.weight": "model-00009-of-00028.safetensors", "model.layers.19.mlp.up_proj.weight": "model-00009-of-00028.safetensors", "model.layers.19.post_attention_layernorm.weight": "model-00009-of-00028.safetensors", "model.layers.19.self_attn.k_proj.weight": "model-00009-of-00028.safetensors", "model.layers.19.self_attn.o_proj.weight": "model-00009-of-00028.safetensors", "model.layers.19.self_attn.q_proj.weight": "model-00009-of-00028.safetensors", "model.layers.19.self_attn.v_proj.weight": "model-00009-of-00028.safetensors", "model.layers.2.input_layernorm.weight": "model-00009-of-00028.safetensors", "model.layers.2.mlp.down_proj.weight": "model-00009-of-00028.safetensors", "model.layers.2.mlp.gate_proj.weight": "model-00009-of-00028.safetensors", "model.layers.2.mlp.up_proj.weight": "model-00010-of-00028.safetensors", "model.layers.2.post_attention_layernorm.weight": "model-00010-of-00028.safetensors", "model.layers.2.self_attn.k_proj.weight": "model-00010-of-00028.safetensors", "model.layers.2.self_attn.o_proj.weight": "model-00010-of-00028.safetensors", "model.layers.2.self_attn.q_proj.weight": "model-00010-of-00028.safetensors", "model.layers.2.self_attn.v_proj.weight": "model-00010-of-00028.safetensors", "model.layers.20.input_layernorm.weight": "model-00010-of-00028.safetensors", "model.layers.20.mlp.down_proj.weight": "model-00010-of-00028.safetensors", "model.layers.20.mlp.gate_proj.weight": "model-00010-of-00028.safetensors", "model.layers.20.mlp.up_proj.weight": "model-00010-of-00028.safetensors", "model.layers.20.post_attention_layernorm.weight": "model-00010-of-00028.safetensors", "model.layers.20.self_attn.k_proj.weight": "model-00010-of-00028.safetensors", "model.layers.20.self_attn.o_proj.weight": "model-00010-of-00028.safetensors", 
"model.layers.20.self_attn.q_proj.weight": "model-00010-of-00028.safetensors", "model.layers.20.self_attn.v_proj.weight": "model-00010-of-00028.safetensors", "model.layers.21.input_layernorm.weight": "model-00010-of-00028.safetensors", "model.layers.21.mlp.down_proj.weight": "model-00011-of-00028.safetensors", "model.layers.21.mlp.gate_proj.weight": "model-00011-of-00028.safetensors", "model.layers.21.mlp.up_proj.weight": "model-00011-of-00028.safetensors", "model.layers.21.post_attention_layernorm.weight": "model-00011-of-00028.safetensors", "model.layers.21.self_attn.k_proj.weight": "model-00011-of-00028.safetensors", "model.layers.21.self_attn.o_proj.weight": "model-00011-of-00028.safetensors", "model.layers.21.self_attn.q_proj.weight": "model-00011-of-00028.safetensors", "model.layers.21.self_attn.v_proj.weight": "model-00011-of-00028.safetensors", "model.layers.22.input_layernorm.weight": "model-00011-of-00028.safetensors", "model.layers.22.mlp.down_proj.weight": "model-00011-of-00028.safetensors", "model.layers.22.mlp.gate_proj.weight": "model-00011-of-00028.safetensors", "model.layers.22.mlp.up_proj.weight": "model-00012-of-00028.safetensors", "model.layers.22.post_attention_layernorm.weight": "model-00012-of-00028.safetensors", "model.layers.22.self_attn.k_proj.weight": "model-00012-of-00028.safetensors", "model.layers.22.self_attn.o_proj.weight": "model-00012-of-00028.safetensors", "model.layers.22.self_attn.q_proj.weight": "model-00012-of-00028.safetensors", "model.layers.22.self_attn.v_proj.weight": "model-00012-of-00028.safetensors", "model.layers.23.input_layernorm.weight": "model-00012-of-00028.safetensors", "model.layers.23.mlp.down_proj.weight": "model-00012-of-00028.safetensors", "model.layers.23.mlp.gate_proj.weight": "model-00012-of-00028.safetensors", "model.layers.23.mlp.up_proj.weight": "model-00012-of-00028.safetensors", "model.layers.23.post_attention_layernorm.weight": "model-00012-of-00028.safetensors", 
"model.layers.23.self_attn.k_proj.weight": "model-00012-of-00028.safetensors", "model.layers.23.self_attn.o_proj.weight": "model-00012-of-00028.safetensors", "model.layers.23.self_attn.q_proj.weight": "model-00012-of-00028.safetensors", "model.layers.23.self_attn.v_proj.weight": "model-00012-of-00028.safetensors", "model.layers.24.input_layernorm.weight": "model-00012-of-00028.safetensors", "model.layers.24.mlp.down_proj.weight": "model-00013-of-00028.safetensors", "model.layers.24.mlp.gate_proj.weight": "model-00013-of-00028.safetensors", "model.layers.24.mlp.up_proj.weight": "model-00013-of-00028.safetensors", "model.layers.24.post_attention_layernorm.weight": "model-00013-of-00028.safetensors", "model.layers.24.self_attn.k_proj.weight": "model-00013-of-00028.safetensors", "model.layers.24.self_attn.o_proj.weight": "model-00013-of-00028.safetensors", "model.layers.24.self_attn.q_proj.weight": "model-00013-of-00028.safetensors", "model.layers.24.self_attn.v_proj.weight": "model-00013-of-00028.safetensors", "model.layers.25.input_layernorm.weight": "model-00013-of-00028.safetensors", "model.layers.25.mlp.down_proj.weight": "model-00013-of-00028.safetensors", "model.layers.25.mlp.gate_proj.weight": "model-00013-of-00028.safetensors", "model.layers.25.mlp.up_proj.weight": "model-00014-of-00028.safetensors", "model.layers.25.post_attention_layernorm.weight": "model-00014-of-00028.safetensors", "model.layers.25.self_attn.k_proj.weight": "model-00014-of-00028.safetensors", "model.layers.25.self_attn.o_proj.weight": "model-00014-of-00028.safetensors", "model.layers.25.self_attn.q_proj.weight": "model-00014-of-00028.safetensors", "model.layers.25.self_attn.v_proj.weight": "model-00014-of-00028.safetensors", "model.layers.26.input_layernorm.weight": "model-00014-of-00028.safetensors", "model.layers.26.mlp.down_proj.weight": "model-00014-of-00028.safetensors", "model.layers.26.mlp.gate_proj.weight": "model-00014-of-00028.safetensors", "model.layers.26.mlp.up_proj.weight": 
"model-00014-of-00028.safetensors", "model.layers.26.post_attention_layernorm.weight": "model-00014-of-00028.safetensors", "model.layers.26.self_attn.k_proj.weight": "model-00014-of-00028.safetensors", "model.layers.26.self_attn.o_proj.weight": "model-00014-of-00028.safetensors", "model.layers.26.self_attn.q_proj.weight": "model-00014-of-00028.safetensors", "model.layers.26.self_attn.v_proj.weight": "model-00014-of-00028.safetensors", "model.layers.27.input_layernorm.weight": "model-00014-of-00028.safetensors", "model.layers.27.mlp.down_proj.weight": "model-00015-of-00028.safetensors", "model.layers.27.mlp.gate_proj.weight": "model-00015-of-00028.safetensors", "model.layers.27.mlp.up_proj.weight": "model-00015-of-00028.safetensors", "model.layers.27.post_attention_layernorm.weight": "model-00015-of-00028.safetensors", "model.layers.27.self_attn.k_proj.weight": "model-00015-of-00028.safetensors", "model.layers.27.self_attn.o_proj.weight": "model-00015-of-00028.safetensors", "model.layers.27.self_attn.q_proj.weight": "model-00015-of-00028.safetensors", "model.layers.27.self_attn.v_proj.weight": "model-00015-of-00028.safetensors", "model.layers.28.input_layernorm.weight": "model-00015-of-00028.safetensors", "model.layers.28.mlp.down_proj.weight": "model-00015-of-00028.safetensors", "model.layers.28.mlp.gate_proj.weight": "model-00015-of-00028.safetensors", "model.layers.28.mlp.up_proj.weight": "model-00016-of-00028.safetensors", "model.layers.28.post_attention_layernorm.weight": "model-00016-of-00028.safetensors", "model.layers.28.self_attn.k_proj.weight": "model-00016-of-00028.safetensors", "model.layers.28.self_attn.o_proj.weight": "model-00016-of-00028.safetensors", "model.layers.28.self_attn.q_proj.weight": "model-00016-of-00028.safetensors", "model.layers.28.self_attn.v_proj.weight": "model-00016-of-00028.safetensors", "model.layers.29.input_layernorm.weight": "model-00016-of-00028.safetensors", "model.layers.29.mlp.down_proj.weight": 
"model-00016-of-00028.safetensors", "model.layers.29.mlp.gate_proj.weight": "model-00016-of-00028.safetensors", "model.layers.29.mlp.up_proj.weight": "model-00016-of-00028.safetensors", "model.layers.29.post_attention_layernorm.weight": "model-00016-of-00028.safetensors", "model.layers.29.self_attn.k_proj.weight": "model-00016-of-00028.safetensors", "model.layers.29.self_attn.o_proj.weight": "model-00016-of-00028.safetensors", "model.layers.29.self_attn.q_proj.weight": "model-00016-of-00028.safetensors", "model.layers.29.self_attn.v_proj.weight": "model-00016-of-00028.safetensors", "model.layers.3.input_layernorm.weight": "model-00016-of-00028.safetensors", "model.layers.3.mlp.down_proj.weight": "model-00017-of-00028.safetensors", "model.layers.3.mlp.gate_proj.weight": "model-00017-of-00028.safetensors", "model.layers.3.mlp.up_proj.weight": "model-00017-of-00028.safetensors", "model.layers.3.post_attention_layernorm.weight": "model-00017-of-00028.safetensors", "model.layers.3.self_attn.k_proj.weight": "model-00017-of-00028.safetensors", "model.layers.3.self_attn.o_proj.weight": "model-00017-of-00028.safetensors", "model.layers.3.self_attn.q_proj.weight": "model-00017-of-00028.safetensors", "model.layers.3.self_attn.v_proj.weight": "model-00017-of-00028.safetensors", "model.layers.30.input_layernorm.weight": "model-00017-of-00028.safetensors", "model.layers.30.mlp.down_proj.weight": "model-00017-of-00028.safetensors", "model.layers.30.mlp.gate_proj.weight": "model-00017-of-00028.safetensors", "model.layers.30.mlp.up_proj.weight": "model-00018-of-00028.safetensors", "model.layers.30.post_attention_layernorm.weight": "model-00018-of-00028.safetensors", "model.layers.30.self_attn.k_proj.weight": "model-00018-of-00028.safetensors", "model.layers.30.self_attn.o_proj.weight": "model-00018-of-00028.safetensors", "model.layers.30.self_attn.q_proj.weight": "model-00018-of-00028.safetensors", "model.layers.30.self_attn.v_proj.weight": "model-00018-of-00028.safetensors", 
"model.layers.31.input_layernorm.weight": "model-00018-of-00028.safetensors", "model.layers.31.mlp.down_proj.weight": "model-00018-of-00028.safetensors", "model.layers.31.mlp.gate_proj.weight": "model-00018-of-00028.safetensors", "model.layers.31.mlp.up_proj.weight": "model-00018-of-00028.safetensors", "model.layers.31.post_attention_layernorm.weight": "model-00018-of-00028.safetensors", "model.layers.31.self_attn.k_proj.weight": "model-00018-of-00028.safetensors", "model.layers.31.self_attn.o_proj.weight": "model-00018-of-00028.safetensors", "model.layers.31.self_attn.q_proj.weight": "model-00018-of-00028.safetensors", "model.layers.31.self_attn.v_proj.weight": "model-00018-of-00028.safetensors", "model.layers.32.input_layernorm.weight": "model-00018-of-00028.safetensors", "model.layers.32.mlp.down_proj.weight": "model-00019-of-00028.safetensors", "model.layers.32.mlp.gate_proj.weight": "model-00019-of-00028.safetensors", "model.layers.32.mlp.up_proj.weight": "model-00019-of-00028.safetensors", "model.layers.32.post_attention_layernorm.weight": "model-00019-of-00028.safetensors", "model.layers.32.self_attn.k_proj.weight": "model-00019-of-00028.safetensors", "model.layers.32.self_attn.o_proj.weight": "model-00019-of-00028.safetensors", "model.layers.32.self_attn.q_proj.weight": "model-00019-of-00028.safetensors", "model.layers.32.self_attn.v_proj.weight": "model-00019-of-00028.safetensors", "model.layers.33.input_layernorm.weight": "model-00019-of-00028.safetensors", "model.layers.33.mlp.down_proj.weight": "model-00019-of-00028.safetensors", "model.layers.33.mlp.gate_proj.weight": "model-00019-of-00028.safetensors", "model.layers.33.mlp.up_proj.weight": "model-00020-of-00028.safetensors", "model.layers.33.post_attention_layernorm.weight": "model-00020-of-00028.safetensors", "model.layers.33.self_attn.k_proj.weight": "model-00020-of-00028.safetensors", "model.layers.33.self_attn.o_proj.weight": "model-00020-of-00028.safetensors", 
"model.layers.33.self_attn.q_proj.weight": "model-00020-of-00028.safetensors", "model.layers.33.self_attn.v_proj.weight": "model-00020-of-00028.safetensors", "model.layers.34.input_layernorm.weight": "model-00020-of-00028.safetensors", "model.layers.34.mlp.down_proj.weight": "model-00020-of-00028.safetensors", "model.layers.34.mlp.gate_proj.weight": "model-00020-of-00028.safetensors", "model.layers.34.mlp.up_proj.weight": "model-00020-of-00028.safetensors", "model.layers.34.post_attention_layernorm.weight": "model-00020-of-00028.safetensors", "model.layers.34.self_attn.k_proj.weight": "model-00020-of-00028.safetensors", "model.layers.34.self_attn.o_proj.weight": "model-00020-of-00028.safetensors", "model.layers.34.self_attn.q_proj.weight": "model-00020-of-00028.safetensors", "model.layers.34.self_attn.v_proj.weight": "model-00020-of-00028.safetensors", "model.layers.35.input_layernorm.weight": "model-00020-of-00028.safetensors", "model.layers.35.mlp.down_proj.weight": "model-00021-of-00028.safetensors", "model.layers.35.mlp.gate_proj.weight": "model-00021-of-00028.safetensors", "model.layers.35.mlp.up_proj.weight": "model-00021-of-00028.safetensors", "model.layers.35.post_attention_layernorm.weight": "model-00021-of-00028.safetensors", "model.layers.35.self_attn.k_proj.weight": "model-00021-of-00028.safetensors", "model.layers.35.self_attn.o_proj.weight": "model-00021-of-00028.safetensors", "model.layers.35.self_attn.q_proj.weight": "model-00021-of-00028.safetensors", "model.layers.35.self_attn.v_proj.weight": "model-00021-of-00028.safetensors", "model.layers.36.input_layernorm.weight": "model-00021-of-00028.safetensors", "model.layers.36.mlp.down_proj.weight": "model-00021-of-00028.safetensors", "model.layers.36.mlp.gate_proj.weight": "model-00021-of-00028.safetensors", "model.layers.36.mlp.up_proj.weight": "model-00022-of-00028.safetensors", "model.layers.36.post_attention_layernorm.weight": "model-00022-of-00028.safetensors", 
"model.layers.36.self_attn.k_proj.weight": "model-00022-of-00028.safetensors", "model.layers.36.self_attn.o_proj.weight": "model-00022-of-00028.safetensors", "model.layers.36.self_attn.q_proj.weight": "model-00022-of-00028.safetensors", "model.layers.36.self_attn.v_proj.weight": "model-00022-of-00028.safetensors", "model.layers.37.input_layernorm.weight": "model-00022-of-00028.safetensors", "model.layers.37.mlp.down_proj.weight": "model-00022-of-00028.safetensors", "model.layers.37.mlp.gate_proj.weight": "model-00022-of-00028.safetensors", "model.layers.37.mlp.up_proj.weight": "model-00022-of-00028.safetensors", "model.layers.37.post_attention_layernorm.weight": "model-00022-of-00028.safetensors", "model.layers.37.self_attn.k_proj.weight": "model-00022-of-00028.safetensors", "model.layers.37.self_attn.o_proj.weight": "model-00022-of-00028.safetensors", "model.layers.37.self_attn.q_proj.weight": "model-00022-of-00028.safetensors", "model.layers.37.self_attn.v_proj.weight": "model-00022-of-00028.safetensors", "model.layers.38.input_layernorm.weight": "model-00022-of-00028.safetensors", "model.layers.38.mlp.down_proj.weight": "model-00023-of-00028.safetensors", "model.layers.38.mlp.gate_proj.weight": "model-00023-of-00028.safetensors", "model.layers.38.mlp.up_proj.weight": "model-00023-of-00028.safetensors", "model.layers.38.post_attention_layernorm.weight": "model-00023-of-00028.safetensors", "model.layers.38.self_attn.k_proj.weight": "model-00023-of-00028.safetensors", "model.layers.38.self_attn.o_proj.weight": "model-00023-of-00028.safetensors", "model.layers.38.self_attn.q_proj.weight": "model-00023-of-00028.safetensors", "model.layers.38.self_attn.v_proj.weight": "model-00023-of-00028.safetensors", "model.layers.39.input_layernorm.weight": "model-00023-of-00028.safetensors", "model.layers.39.mlp.down_proj.weight": "model-00023-of-00028.safetensors", "model.layers.39.mlp.gate_proj.weight": "model-00023-of-00028.safetensors", "model.layers.39.mlp.up_proj.weight": 
"model-00024-of-00028.safetensors", "model.layers.39.post_attention_layernorm.weight": "model-00024-of-00028.safetensors", "model.layers.39.self_attn.k_proj.weight": "model-00024-of-00028.safetensors", "model.layers.39.self_attn.o_proj.weight": "model-00024-of-00028.safetensors", "model.layers.39.self_attn.q_proj.weight": "model-00024-of-00028.safetensors", "model.layers.39.self_attn.v_proj.weight": "model-00024-of-00028.safetensors", "model.layers.4.input_layernorm.weight": "model-00024-of-00028.safetensors", "model.layers.4.mlp.down_proj.weight": "model-00024-of-00028.safetensors", "model.layers.4.mlp.gate_proj.weight": "model-00024-of-00028.safetensors", "model.layers.4.mlp.up_proj.weight": "model-00024-of-00028.safetensors", "model.layers.4.post_attention_layernorm.weight": "model-00024-of-00028.safetensors", "model.layers.4.self_attn.k_proj.weight": "model-00024-of-00028.safetensors", "model.layers.4.self_attn.o_proj.weight": "model-00024-of-00028.safetensors", "model.layers.4.self_attn.q_proj.weight": "model-00024-of-00028.safetensors", "model.layers.4.self_attn.v_proj.weight": "model-00024-of-00028.safetensors", "model.layers.5.input_layernorm.weight": "model-00024-of-00028.safetensors", "model.layers.5.mlp.down_proj.weight": "model-00025-of-00028.safetensors", "model.layers.5.mlp.gate_proj.weight": "model-00025-of-00028.safetensors", "model.layers.5.mlp.up_proj.weight": "model-00025-of-00028.safetensors", "model.layers.5.post_attention_layernorm.weight": "model-00025-of-00028.safetensors", "model.layers.5.self_attn.k_proj.weight": "model-00025-of-00028.safetensors", "model.layers.5.self_attn.o_proj.weight": "model-00025-of-00028.safetensors", "model.layers.5.self_attn.q_proj.weight": "model-00025-of-00028.safetensors", "model.layers.5.self_attn.v_proj.weight": "model-00025-of-00028.safetensors", "model.layers.6.input_layernorm.weight": "model-00025-of-00028.safetensors", "model.layers.6.mlp.down_proj.weight": "model-00025-of-00028.safetensors", 
"model.layers.6.mlp.gate_proj.weight": "model-00025-of-00028.safetensors", "model.layers.6.mlp.up_proj.weight": "model-00026-of-00028.safetensors", "model.layers.6.post_attention_layernorm.weight": "model-00026-of-00028.safetensors", "model.layers.6.self_attn.k_proj.weight": "model-00026-of-00028.safetensors", "model.layers.6.self_attn.o_proj.weight": "model-00026-of-00028.safetensors", "model.layers.6.self_attn.q_proj.weight": "model-00026-of-00028.safetensors", "model.layers.6.self_attn.v_proj.weight": "model-00026-of-00028.safetensors", "model.layers.7.input_layernorm.weight": "model-00026-of-00028.safetensors", "model.layers.7.mlp.down_proj.weight": "model-00026-of-00028.safetensors", "model.layers.7.mlp.gate_proj.weight": "model-00026-of-00028.safetensors", "model.layers.7.mlp.up_proj.weight": "model-00026-of-00028.safetensors", "model.layers.7.post_attention_layernorm.weight": "model-00026-of-00028.safetensors", "model.layers.7.self_attn.k_proj.weight": "model-00026-of-00028.safetensors", "model.layers.7.self_attn.o_proj.weight": "model-00026-of-00028.safetensors", "model.layers.7.self_attn.q_proj.weight": "model-00026-of-00028.safetensors", "model.layers.7.self_attn.v_proj.weight": "model-00026-of-00028.safetensors", "model.layers.8.input_layernorm.weight": "model-00026-of-00028.safetensors", "model.layers.8.mlp.down_proj.weight": "model-00027-of-00028.safetensors", "model.layers.8.mlp.gate_proj.weight": "model-00027-of-00028.safetensors", "model.layers.8.mlp.up_proj.weight": "model-00027-of-00028.safetensors", "model.layers.8.post_attention_layernorm.weight": "model-00027-of-00028.safetensors", "model.layers.8.self_attn.k_proj.weight": "model-00027-of-00028.safetensors", "model.layers.8.self_attn.o_proj.weight": "model-00027-of-00028.safetensors", "model.layers.8.self_attn.q_proj.weight": "model-00027-of-00028.safetensors", "model.layers.8.self_attn.v_proj.weight": "model-00027-of-00028.safetensors", "model.layers.9.input_layernorm.weight": 
"model-00027-of-00028.safetensors", "model.layers.9.mlp.down_proj.weight": "model-00027-of-00028.safetensors", "model.layers.9.mlp.gate_proj.weight": "model-00027-of-00028.safetensors", "model.layers.9.mlp.up_proj.weight": "model-00028-of-00028.safetensors", "model.layers.9.post_attention_layernorm.weight": "model-00028-of-00028.safetensors", "model.layers.9.self_attn.k_proj.weight": "model-00028-of-00028.safetensors", "model.layers.9.self_attn.o_proj.weight": "model-00028-of-00028.safetensors", "model.layers.9.self_attn.q_proj.weight": "model-00028-of-00028.safetensors", "model.layers.9.self_attn.v_proj.weight": "model-00028-of-00028.safetensors", "model.norm.weight": "model-00028-of-00028.safetensors"}}
special_tokens_map.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|assistant|>",
4
+ "<|prefix_end|>",
5
+ "<|system|>",
6
+ "<|prefix_begin|>",
7
+ "<|prompter|>"
8
+ ],
9
+ "bos_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "pad_token": {
24
+ "content": "</s>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "sep_token": {
31
+ "content": "<s>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "unk_token": {
38
+ "content": "<unk>",
39
+ "lstrip": false,
40
+ "normalized": true,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ }
44
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
+ size 499723
tokenizer_config.json ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "added_tokens_decoder": {
5
+ "0": {
6
+ "content": "<unk>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "1": {
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "2": {
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "32000": {
30
+ "content": "<pad>",
31
+ "lstrip": false,
32
+ "normalized": true,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": false
36
+ },
37
+ "32001": {
38
+ "content": "<|assistant|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false,
43
+ "special": true
44
+ },
45
+ "32002": {
46
+ "content": "<|prefix_end|>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false,
51
+ "special": true
52
+ },
53
+ "32003": {
54
+ "content": "<|system|>",
55
+ "lstrip": false,
56
+ "normalized": false,
57
+ "rstrip": false,
58
+ "single_word": false,
59
+ "special": true
60
+ },
61
+ "32004": {
62
+ "content": "<|prefix_begin|>",
63
+ "lstrip": false,
64
+ "normalized": false,
65
+ "rstrip": false,
66
+ "single_word": false,
67
+ "special": true
68
+ },
69
+ "32005": {
70
+ "content": "<|prompter|>",
71
+ "lstrip": false,
72
+ "normalized": false,
73
+ "rstrip": false,
74
+ "single_word": false,
75
+ "special": true
76
+ }
77
+ },
78
+ "additional_special_tokens": [
79
+ "<|assistant|>",
80
+ "<|prefix_end|>",
81
+ "<|system|>",
82
+ "<|prefix_begin|>",
83
+ "<|prompter|>"
84
+ ],
85
+ "bos_token": "<s>",
86
+ "clean_up_tokenization_spaces": false,
87
+ "eos_token": "</s>",
88
+ "legacy": false,
89
+ "model_max_length": 1000000000000000019884624838656,
90
+ "pad_token": "</s>",
91
+ "sep_token": "<s>",
92
+ "sp_model_kwargs": {},
93
+ "tokenizer_class": "LlamaTokenizer",
94
+ "unk_token": "<unk>",
95
+ "use_default_system_prompt": false
96
+ }