cpatonn committed on
Commit
0c11e38
·
verified ·
1 Parent(s): 36f4419

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,358 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ license: other
4
+ license_name: lfm1.0
5
+ license_link: LICENSE
6
+ language:
7
+ - en
8
+ - ar
9
+ - zh
10
+ - fr
11
+ - de
12
+ - ja
13
+ - ko
14
+ - es
15
+ pipeline_tag: text-generation
16
+ tags:
17
+ - liquid
18
+ - lfm2
19
+ - edge
20
+ - moe
21
+ base_model: LiquidAI/LFM2-8B-A1B
22
+ ---
23
+
24
+ <center>
25
+ <div style="text-align: center;">
26
+ <img
27
+ src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/7_6D7rWrLxp2hb6OHSV1p.png"
28
+ alt="Liquid AI"
29
+ style="width: 100%; max-width: 66%; height: auto; display: inline-block; margin-bottom: 0.5em; margin-top: 0.5em;"
30
+ />
31
+ </div>
32
+ <div style="display: flex; justify-content: center;">
33
+ <a href="https://playground.liquid.ai/chat">
34
+ <svg width="114.8" height="20" viewBox="0 0 900 200" xmlns="http://www.w3.org/2000/svg" role="img" aria-label="Playground" style="margin-bottom: 1em;">
35
+ <title>Playground</title>
36
+ <g>
37
+ <rect fill="#fff" width="200" height="200"></rect>
38
+ <rect fill="url(#x)" x="200" width="800" height="200"></rect>
39
+ </g>
40
+ <g transform="translate(35, 30) scale(0.45, 0.45)">
41
+ <path d="M172.314 129.313L172.219 129.367L206.125 188.18C210.671 195.154 213.324 203.457 213.324 212.382C213.324 220.834 210.956 228.739 206.839 235.479L275.924 213.178L167.853 33.6L141.827 76.9614L172.314 129.313Z" fill="black"/>
42
+ <path d="M114.217 302.4L168.492 257.003C168.447 257.003 168.397 257.003 168.352 257.003C143.515 257.003 123.385 237.027 123.385 212.387C123.385 203.487 126.023 195.204 130.55 188.24L162.621 132.503L135.966 86.7327L60.0762 213.183L114.127 302.4H114.217Z" fill="black"/>
43
+ <path d="M191.435 250.681C191.435 250.681 191.43 250.681 191.425 250.686L129.71 302.4H221.294L267.71 226.593L191.435 250.686V250.681Z" fill="black"/>
44
+ </g>
45
+ <g transform="translate(50, 0)" aria-hidden="true" fill="#fff" text-anchor="start" font-family="Verdana,DejaVu Sans,sans-serif" font-size="110">
46
+ <text x="255" y="148" textLength="619" fill="#000" opacity="0.1">Playground</text>
47
+ <text x="245" y="138" textLength="619">Playground</text>
48
+ </g>
49
+ <linearGradient id="x" x1="0%" y1="0%" x2="100%" y2="0%">
50
+ <stop offset="0%" style="stop-color:#000000"></stop>
51
+ <stop offset="100%" style="stop-color:#000000"></stop>
52
+ </linearGradient>
53
+ </svg>
54
+ </a>
55
+ <a href="https://leap.liquid.ai/?utm_source=huggingface&utm_medium=modelcards">
56
+ <svg width="114.8" height="20" viewBox="0 0 900 200" xmlns="http://www.w3.org/2000/svg" role="img" aria-label="Leap" style="margin-bottom: 1em;">
57
+ <title>Leap</title>
58
+ <g>
59
+ <rect fill="#000" width="500" height="200"></rect>
60
+ </g>
61
+ <g transform="translate(100, 45) scale(3.5, 3.5)" fill="#fff">
62
+ <path d="M13.8512 28.0769C12.5435 28.0769 11.4025 27.8205 10.4281 27.3077C9.45375 26.7692 8.68452 26.0128 8.12042 25.0385C7.58196 24.0641 7.31273 22.9359 7.31273 21.6538V3.76923H0.389648V0H11.4666V21.6538C11.4666 22.4744 11.6973 23.1282 12.1589 23.6154C12.6204 24.0769 13.2486 24.3077 14.0435 24.3077H20.582V28.0769H13.8512Z"/>
63
+ <path d="M29.6439 28.4615C27.9259 28.4615 26.4131 28.1282 25.1054 27.4615C23.8233 26.7692 22.8362 25.8077 22.1439 24.5769C21.4516 23.3462 21.1054 21.9103 21.1054 20.2692V14.7308C21.1054 13.0641 21.4516 11.6282 22.1439 10.4231C22.8362 9.19231 23.8233 8.24359 25.1054 7.57692C26.4131 6.88462 27.9259 6.53846 29.6439 6.53846C31.3875 6.53846 32.9003 6.88462 34.1823 7.57692C35.4644 8.24359 36.4516 9.19231 37.1439 10.4231C37.8362 11.6282 38.1823 13.0641 38.1823 14.7308V18.5H25.1054V20.2692C25.1054 21.8333 25.49 23.0256 26.2592 23.8462C27.0541 24.6667 28.1951 25.0769 29.6823 25.0769C30.8875 25.0769 31.8618 24.8718 32.6054 24.4615C33.349 24.0256 33.8105 23.3974 33.99 22.5769H38.1054C37.7977 24.3718 36.8746 25.8077 35.3362 26.8846C33.7977 27.9359 31.9003 28.4615 29.6439 28.4615ZM34.1823 16V14.6923C34.1823 13.1538 33.7977 11.9615 33.0285 11.1154C32.2592 10.2692 31.131 9.84615 29.6439 9.84615C28.1823 9.84615 27.0541 10.2692 26.2592 11.1154C25.49 11.9615 25.1054 13.1667 25.1054 14.7308V15.6923L34.49 15.6538L34.1823 16Z"/>
64
+ <path d="M46.3596 28.4615C44.1545 28.4615 42.4109 27.8974 41.1288 26.7692C39.8724 25.6154 39.2442 24.0513 39.2442 22.0769C39.2442 20.0769 39.9109 18.5128 41.2442 17.3846C42.6032 16.2308 44.4622 15.6538 46.8211 15.6538H52.7058V13.6923C52.7058 12.5385 52.3468 11.641 51.6288 11C50.9109 10.359 49.8981 10.0385 48.5904 10.0385C47.4365 10.0385 46.475 10.2949 45.7058 10.8077C44.9365 11.2949 44.4878 11.9487 44.3596 12.7692H40.2827C40.5135 10.8718 41.3852 9.35897 42.8981 8.23077C44.4365 7.10256 46.3724 6.53846 48.7058 6.53846C51.2186 6.53846 53.2058 7.17949 54.6673 8.46154C56.1288 9.71795 56.8596 11.4359 56.8596 13.6154V28.0769H52.8211V24.1923H52.1288L52.8211 23.4231C52.8211 24.9615 52.2314 26.1923 51.0519 27.1154C49.8724 28.0128 48.3083 28.4615 46.3596 28.4615ZM47.5904 25.2692C49.0776 25.2692 50.2955 24.8974 51.2442 24.1538C52.2186 23.3846 52.7058 22.4103 52.7058 21.2308V18.4615H46.8981C45.8211 18.4615 44.9622 18.7564 44.3211 19.3462C43.7058 19.9359 43.3981 20.7436 43.3981 21.7692C43.3981 22.8462 43.7699 23.7051 44.5135 24.3462C45.257 24.9615 46.2827 25.2692 47.5904 25.2692Z"/>
65
+ <path d="M58.9984 35V6.92308H63.1138V10.9615H63.9984L63.1138 11.9231C63.1138 10.2564 63.6266 8.94872 64.6523 8C65.7036 7.02564 67.101 6.53846 68.8446 6.53846C70.9728 6.53846 72.6651 7.25641 73.9215 8.69231C75.2036 10.1026 75.8446 12.0385 75.8446 14.5V20.4615C75.8446 22.1026 75.5497 23.5256 74.96 24.7308C74.3959 25.9103 73.5882 26.8333 72.5369 27.5C71.5113 28.141 70.2805 28.4615 68.8446 28.4615C67.1266 28.4615 65.742 27.9872 64.6907 27.0385C63.6395 26.0641 63.1138 24.7436 63.1138 23.0769L63.9984 24.0385H63.0369L63.1523 28.9615V35H58.9984ZM67.4215 24.8462C68.7805 24.8462 69.8318 24.4615 70.5754 23.6923C71.3446 22.8974 71.7292 21.7564 71.7292 20.2692V14.7308C71.7292 13.2436 71.3446 12.1154 70.5754 11.3462C69.8318 10.5513 68.7805 10.1538 67.4215 10.1538C66.1138 10.1538 65.0754 10.5641 64.3061 11.3846C63.5369 12.1795 63.1523 13.2949 63.1523 14.7308V20.2692C63.1523 21.7051 63.5369 22.8333 64.3061 23.6538C65.0754 24.4487 66.1138 24.8462 67.4215 24.8462Z"/>
66
+ </g>
67
+ <linearGradient id="y" x1="0%" y1="0%" x2="100%" y2="0%">
68
+ <stop offset="0%" style="stop-color:#000000"></stop>
69
+ </linearGradient>
70
+ </svg>
71
+ </a>
72
+ </div>
73
+ </center>
74
+
75
+ # LFM2-8B-A1B
76
+
77
+ LFM2 is a new generation of hybrid models developed by [Liquid AI](https://www.liquid.ai/blog/lfm2-8b-a1b-an-efficient-on-device-mixture-of-experts), specifically designed for edge AI and on-device deployment. It sets a new standard in terms of quality, speed, and memory efficiency.
78
+
79
+ We're releasing the weights of our first MoE based on LFM2, with 8.3B total parameters and 1.5B active parameters.
80
+
81
+ - LFM2-8B-A1B is the best on-device MoE in terms of both **quality** (comparable to 3-4B dense models) and **speed** (faster than Qwen3-1.7B).
82
+ - **Code and knowledge** capabilities are significantly improved compared to LFM2-2.6B.
83
+ - Quantized variants fit comfortably on high-end **phones, tablets, and laptops**.
84
+
85
+ Find more information about LFM2-8B-A1B in our [blog post](https://www.liquid.ai/blog/lfm2-8b-a1b-an-efficient-on-device-mixture-of-experts).
86
+
87
+ ## 📄 Model details
88
+
89
+ Due to their small size, **we recommend fine-tuning LFM2 models on narrow use cases** to maximize performance.
90
+ They are particularly suited for agentic tasks, data extraction, RAG, creative writing, and multi-turn conversations.
91
+ However, we do not recommend using them for tasks that are knowledge-intensive or require programming skills.
92
+
93
+ | Property | [**LFM2-8B-A1B**](https://huggingface.co/LiquidAI/LFM2-8B-A1B) |
94
+ | --------------------- | ----------------------------- |
95
+ | **Total parameters** | 8.3B |
96
+ | **Active parameters** | 1.5B |
97
+ | **Layers** | 24 (18 conv + 6 attn) |
98
+ | **Context length** | 32,768 tokens |
99
+ | **Vocabulary size** | 65,536 |
100
+ | **Training precision**| Mixed BF16/FP8 |
101
+ | **Training budget** | 12 trillion tokens |
102
+ | **License** | LFM Open License v1.0 |
103
+
104
+ **Supported languages**: English, Arabic, Chinese, French, German, Japanese, Korean, and Spanish.
105
+
106
+ **Generation parameters**: We recommend the following parameters:
107
+ * `temperature=0.3`
108
+ * `min_p=0.15`
109
+ * `repetition_penalty=1.05`
110
+
111
+ **Chat template**: LFM2 uses a ChatML-like chat template as follows:
112
+
113
+ ```
114
+ <|startoftext|><|im_start|>system
115
+ You are a helpful assistant trained by Liquid AI.<|im_end|>
116
+ <|im_start|>user
117
+ What is C. elegans?<|im_end|>
118
+ <|im_start|>assistant
119
+ It's a tiny nematode that lives in temperate soil environments.<|im_end|>
120
+ ```
121
+
122
+ You can automatically apply it using the dedicated [`.apply_chat_template()`](https://huggingface.co/docs/transformers/en/chat_templating#applychattemplate) function from Hugging Face transformers.
123
+
124
+ **Tool use**: It consists of four main steps:
125
+ 1. **Function definition**: LFM2 takes JSON function definitions as input (JSON objects between `<|tool_list_start|>` and `<|tool_list_end|>` special tokens), usually in the system prompt.
126
+ 2. **Function call**: LFM2 writes Pythonic function calls (a Python list between `<|tool_call_start|>` and `<|tool_call_end|>` special tokens), as the assistant answer.
127
+ 3. **Function execution**: The function call is executed and the result is returned (string between `<|tool_response_start|>` and `<|tool_response_end|>` special tokens), as a "tool" role.
128
+ 4. **Final answer**: LFM2 interprets the outcome of the function call to address the original user prompt in plain text.
129
+
130
+ Here is a simple example of a conversation using tool use:
131
+
132
+ ```
133
+ <|startoftext|><|im_start|>system
134
+ List of tools: <|tool_list_start|>[{"name": "get_candidate_status", "description": "Retrieves the current status of a candidate in the recruitment process", "parameters": {"type": "object", "properties": {"candidate_id": {"type": "string", "description": "Unique identifier for the candidate"}}, "required": ["candidate_id"]}}]<|tool_list_end|><|im_end|>
135
+ <|im_start|>user
136
+ What is the current status of candidate ID 12345?<|im_end|>
137
+ <|im_start|>assistant
138
+ <|tool_call_start|>[get_candidate_status(candidate_id="12345")]<|tool_call_end|>Checking the current status of candidate ID 12345.<|im_end|>
139
+ <|im_start|>tool
140
+ <|tool_response_start|>{"candidate_id": "12345", "status": "Interview Scheduled", "position": "Clinical Research Associate", "date": "2023-11-20"}<|tool_response_end|><|im_end|>
141
+ <|im_start|>assistant
142
+ The candidate with ID 12345 is currently in the "Interview Scheduled" stage for the position of Clinical Research Associate, with an interview date set for 2023-11-20.<|im_end|>
143
+ ```
144
+
145
+ **Architecture**: Hybrid model with multiplicative gates and short convolutions: 18 double-gated short-range LIV convolution blocks and 6 grouped query attention (GQA) blocks.
146
+
147
+ **Pre-training mixture**: Approximately 75% English, 20% multilingual, and 5% code data sourced from the web and licensed materials.
148
+
149
+ **Training approach**:
150
+ * Very large-scale SFT on 50% downstream tasks, 50% general domains
151
+ * Custom DPO with length normalization and semi-online datasets
152
+ * Iterative model merging
153
+
154
+ ## 🏃 How to run LFM2
155
+
156
+ ### 1. Transformers
157
+
158
+ To run LFM2, you need to install Hugging Face [`transformers`](https://github.com/huggingface/transformers) from source as follows:
159
+ ```bash
160
+ pip install git+https://github.com/huggingface/transformers.git@0c9a72e4576fe4c84077f066e585129c97bfd4e6
161
+ ```
162
+
163
+ Here is an example of how to generate an answer with transformers in Python:
164
+
165
+ ```python
166
+ from transformers import AutoModelForCausalLM, AutoTokenizer
167
+
168
+ # Load model and tokenizer
169
+ model_id = "LiquidAI/LFM2-8B-A1B"
170
+ model = AutoModelForCausalLM.from_pretrained(
171
+ model_id,
172
+ device_map="auto",
173
+ dtype="bfloat16",
174
+ # attn_implementation="flash_attention_2" <- uncomment on compatible GPU
175
+ )
176
+ tokenizer = AutoTokenizer.from_pretrained(model_id)
177
+
178
+ # Generate answer
179
+ prompt = "What is C. elegans?"
180
+ input_ids = tokenizer.apply_chat_template(
181
+ [{"role": "user", "content": prompt}],
182
+ add_generation_prompt=True,
183
+ return_tensors="pt",
184
+ tokenize=True,
185
+ ).to(model.device)
186
+
187
+ output = model.generate(
188
+ input_ids,
189
+ do_sample=True,
190
+ temperature=0.3,
191
+ min_p=0.15,
192
+ repetition_penalty=1.05,
193
+ max_new_tokens=512,
194
+ )
195
+
196
+ print(tokenizer.decode(output[0], skip_special_tokens=False))
197
+
198
+ # <|startoftext|><|im_start|>user
199
+ # What is C. elegans?<|im_end|>
200
+ # <|im_start|>assistant
201
+ # C. elegans, also known as Caenorhabditis elegans, is a small, free-living
202
+ # nematode worm (roundworm) that belongs to the phylum Nematoda.
203
+ ```
204
+
205
+ You can directly run and test the model with this [Colab notebook](https://colab.research.google.com/drive/1i0u7X6qen9UJkV6xSCDZ0NmPUH50SOvO?usp=sharing).
206
+
207
+ ### 2. vLLM
208
+
209
+ You can run the model in [`vLLM`](https://github.com/vllm-project/vllm) by building from source:
210
+
211
+ ```bash
212
+ git clone https://github.com/vllm-project/vllm.git
213
+ cd vllm
214
+ pip install -e . -v
215
+ ```
216
+
217
+ Here is an example of how to use it for inference:
218
+
219
+ ```python
220
+ from vllm import LLM, SamplingParams
221
+
222
+ prompts = [
223
+ [
224
+ {
225
+ "content": "What is C. elegans?",
226
+ "role": "user",
227
+ },
228
+ ],
229
+ [
230
+ {
231
+ "content": "Say hi in JSON format",
232
+ "role": "user",
233
+ },
234
+ ],
235
+ [
236
+ {
237
+ "content": "Define AI in Spanish",
238
+ "role": "user",
239
+ },
240
+ ],
241
+ ]
242
+
243
+ sampling_params = SamplingParams(
244
+ temperature=0.3,
245
+ min_p=0.15,
246
+ repetition_penalty=1.05,
247
+ max_tokens=30
248
+ )
249
+
250
+ llm = LLM(model="LiquidAI/LFM2-8B-A1B", dtype="bfloat16")
251
+
252
+ outputs = llm.chat(prompts, sampling_params)
253
+
254
+ for i, output in enumerate(outputs):
255
+ prompt = prompts[i][0]["content"]
256
+ generated_text = output.outputs[0].text
257
+ print(f"Prompt: {prompt!r}, Generated text: {generated_text!r}")
258
+ ```
259
+
260
+
261
+ ### 3. llama.cpp
262
+
263
+ You can run LFM2 with llama.cpp using its [GGUF checkpoint](https://huggingface.co/LiquidAI/LFM2-8B-A1B-GGUF). Find more information in the model card.
264
+
265
+ ## 🔧 How to fine-tune LFM2
266
+
267
+ We recommend fine-tuning LFM2 models on your use cases to maximize performance.
268
+
269
+ | Notebook | Description | Link |
270
+ |-------|------|------|
271
+ | SFT (TRL) | Supervised Fine-Tuning (SFT) notebook with a LoRA adapter using TRL. | <a href="https://colab.research.google.com/drive/1OXLEuSmzF4AjJ7yqRCDTn-ltvFjoGR9j?usp=sharing"><img src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/vlOyMEjwHa_b_LXysEu2E.png" width="110" alt="Colab link"></a> |
272
+ | DPO (TRL) | Preference alignment with Direct Preference Optimization (DPO) using TRL. | <a href="https://colab.research.google.com/drive/1Q8hIHIQ8oofshcNYHUcYp1akUcZ-ufSn?usp=sharing"><img src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/vlOyMEjwHa_b_LXysEu2E.png" width="110" alt="Colab link"></a> |
273
+
274
+ ## 📈 Performance
275
+
276
+ ### 1. Automated benchmarks
277
+
278
+ <div style="display: grid">
279
+ <div>
280
+ <a href="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/6xXgpyyK5htUZlHdpZab-.png" target="_blank">
281
+ <img src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/6xXgpyyK5htUZlHdpZab-.png" alt="Benchmarks" style="width: 100%; height: auto; margin: 0; cursor: pointer;">
282
+ </a>
283
+ </div>
284
+ </div>
285
+
286
+ Compared to similar-sized models, LFM2-8B-A1B displays strong performance in instruction following and math while also running significantly faster.
287
+
288
+ | Model | MMLU | MMLU-Pro | GPQA | IFEval | IFBench | Multi-IF |
289
+ |---|---|---|---|---|---|---|
290
+ | **LFM2-8B-A1B** | 64.84 | 37.42 | 29.29 | 77.58 | 25.85 | 58.19 |
291
+ | LFM2-2.6B | 64.42 | 25.96 | 26.57 | 79.56 | 22.19 | 60.26 |
292
+ | Llama-3.2-3B-Instruct | 60.35 | 22.25 | 30.6 | 71.43 | 20.78 | 50.91 |
293
+ | SmolLM3-3B | 59.84 | 23.90 | 26.31 | 72.44 | 17.93 | 58.86 |
294
+ | gemma-3-4b-it | 58.35 | 34.76 | 29.51 | 76.85 | 23.53 | 66.61 |
295
+ | Qwen3-4B-Instruct-2507 | 72.25 | 52.31 | 34.85 | 85.62 | 30.28 | 75.54 |
296
+ | granite-4.0-h-tiny | 66.79 | 32.03 | 26.46 | 81.06 | 18.37 | 52.99 |
297
+
298
+ | Model | GSM8K | GSMPlus | MATH 500 | MATH Lvl 5 | MGSM | MMMLU |
299
+ |---|---|---|---|---|---|---|
300
+ | **LFM2-8B-A1B** | 84.38 | 64.76 | 74.2 | 62.38 | 72.4 | 55.26 |
301
+ | LFM2-2.6B | 82.41 | 60.75 | 63.6 | 54.38 | 74.32 | 55.39 |
302
+ | Llama-3.2-3B-Instruct | 75.21 | 38.68 | 41.2 | 24.06 | 61.68 | 47.92 |
303
+ | SmolLM3-3B | 81.12 | 58.91 | 73.6 | 51.93 | 68.72 | 50.02 |
304
+ | gemma-3-4b-it | 89.92 | 68.38 | 73.2 | 52.18 | 87.28 | 50.14 |
305
+ | Qwen3-4B-Instruct-2507 | 68.46 | 56.16 | 85.6 | 73.62 | 81.76 | 60.67 |
306
+ | granite-4.0-h-tiny | 82.64 | 59.14 | 58.2 | 36.11 | 73.68 | 56.13 |
307
+
308
+ | Model | Active params | LCB v6 | LCB v5 | HumanEval+ | Creative Writing v3 |
309
+ |----------------------------|---------------|---------------|---------------|--------------------|-----------------------------|
310
+ | **LFM2-8B-A1B** | 1.5B | 21.04% | 21.36% | 69.51% | 44.22% |
311
+ | Gemma-3-1b-it | 1B | 4.27% | 4.43% | 37.20% | 41.67% |
312
+ | Granite-4.0-h-tiny | 1B | 26.73% | 27.27% | 73.78% | 32.60% |
313
+ | Llama-3.2-1B-Instruct | 1.2B | 4.08% | 3.64% | 23.17% | 31.43% |
314
+ | Qwen2.5-1.5B-Instruct | 1.5B | 11.18% | 10.57% | 48.78% | 22.18% |
315
+ | Qwen3-1.7B (/no_think) | 1.7B | 24.07% | 26.48% | 60.98% | 31.56% |
316
+ | LFM2-2.6B | 2.6B | 14.41% | 14.43% | 57.93% | 38.79% |
317
+ | SmolLM3-3B | 3.1B | 19.05% | 19.20% | 60.37% | 36.44% |
318
+ | Llama-3.2-3B-Instruct | 3.2B | 11.47% | 11.48% | 24.06% | 38.84% |
319
+ | Qwen3-4B (/no_think) | 4B | 36.11% | 38.64% | 71.95% | 37.49% |
320
+ | Qwen3-4B-Instruct-2507 | 4B | 48.72% | 50.80% | 82.32% | 51.71% |
321
+ | Gemma-3-4b-it | 4.3B | 18.86% | 19.09% | 62.8% | 68.56% |
322
+
323
+ ### 2. Inference
324
+
325
+ LFM2-8B-A1B is significantly faster than models with a similar number of active parameters, like Qwen3-1.7B.
326
+
327
+ <div style="display: grid; grid-template-columns: 1fr 1fr;">
328
+ <div>
329
+ <a href="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/AdR74EuIH_qJre89qaq62.png" target="_blank">
330
+ <img src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/AdR74EuIH_qJre89qaq62.png" alt="Decode Throughput - S24 Ultra" style="width: 100%; height: auto; margin: 0; cursor: pointer;">
331
+ </a>
332
+ </div>
333
+
334
+ <div>
335
+ <a href="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/YzmQXbmcv5WuVJ1tI2Jbh.png" target="_blank">
336
+ <img src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/YzmQXbmcv5WuVJ1tI2Jbh.png" alt="Decode Throughput - HX370" style="width: 100%; height: auto; margin: 0; cursor: pointer;">
337
+ </a>
338
+ </div>
339
+ </div>
340
+
341
+ The following plots showcase the performance of different models under int4 quantization with int8 dynamic activations on the AMD Ryzen AI 9 HX 370 CPU, using 16 threads. The results were obtained using our internal XNNPACK-based inference stack and a custom CPU MoE kernel.
342
+
343
+ <div style="display: grid; grid-template-columns: 1fr 1fr;">
344
+ <div>
345
+ <a href="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/NC4XN11RJB-Ifh758os3e.png" target="_blank">
346
+ <img src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/NC4XN11RJB-Ifh758os3e.png" alt="Prefill Throughput vs Sequence Length" style="width: 100%; height: auto; margin: 0; cursor: pointer;">
347
+ </a>
348
+ </div>
349
+ <div>
350
+ <a href="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/6oAenHRxKIyvJOgdCetlF.png" target="_blank">
351
+ <img src="https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/6oAenHRxKIyvJOgdCetlF.png" alt="Decode Throughput vs Sequence Length" style="width: 100%; height: auto; margin: 0; cursor: pointer;">
352
+ </a>
353
+ </div>
354
+ </div>
355
+
356
+ ## 📬 Contact
357
+
358
+ If you are interested in custom solutions with edge deployment, please contact [our sales team](https://www.liquid.ai/contact).
chat_template.jinja ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {{- bos_token -}}{%- set system_prompt = "" -%}{%- set ns = namespace(system_prompt="") -%}{%- if messages[0]["role"] == "system" -%} {%- set ns.system_prompt = messages[0]["content"] -%} {%- set messages = messages[1:] -%}{%- endif -%}{%- if tools -%} {%- set ns.system_prompt = ns.system_prompt + ("
2
+ " if ns.system_prompt else "") + "List of tools: <|tool_list_start|>[" -%} {%- for tool in tools -%} {%- if tool is not string -%} {%- set tool = tool | tojson -%} {%- endif -%} {%- set ns.system_prompt = ns.system_prompt + tool -%} {%- if not loop.last -%} {%- set ns.system_prompt = ns.system_prompt + ", " -%} {%- endif -%} {%- endfor -%} {%- set ns.system_prompt = ns.system_prompt + "]<|tool_list_end|>" -%}{%- endif -%}{%- if ns.system_prompt -%} {{- "<|im_start|>system
3
+ " + ns.system_prompt + "<|im_end|>
4
+ " -}}{%- endif -%}{%- for message in messages -%} {{- "<|im_start|>" + message["role"] + "
5
+ " -}} {%- set content = message["content"] -%} {%- if content is not string -%} {%- set content = content | tojson -%} {%- endif -%} {%- if message["role"] == "tool" -%} {%- set content = "<|tool_response_start|>" + content + "<|tool_response_end|>" -%} {%- endif -%} {{- content + "<|im_end|>
6
+ " -}}{%- endfor -%}{%- if add_generation_prompt -%} {{- "<|im_start|>assistant
7
+ " -}}{%- endif -%}
config.json ADDED
@@ -0,0 +1,180 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Lfm2MoeForCausalLM"
4
+ ],
5
+ "bos_token_id": 1,
6
+ "conv_L_cache": 3,
7
+ "conv_bias": false,
8
+ "dtype": "bfloat16",
9
+ "eos_token_id": 7,
10
+ "hidden_size": 2048,
11
+ "intermediate_size": 7168,
12
+ "layer_types": [
13
+ "conv",
14
+ "conv",
15
+ "full_attention",
16
+ "conv",
17
+ "conv",
18
+ "conv",
19
+ "full_attention",
20
+ "conv",
21
+ "conv",
22
+ "conv",
23
+ "full_attention",
24
+ "conv",
25
+ "conv",
26
+ "conv",
27
+ "full_attention",
28
+ "conv",
29
+ "conv",
30
+ "conv",
31
+ "full_attention",
32
+ "conv",
33
+ "conv",
34
+ "full_attention",
35
+ "conv",
36
+ "conv"
37
+ ],
38
+ "max_position_embeddings": 128000,
39
+ "model_type": "lfm2_moe",
40
+ "moe_intermediate_size": 1792,
41
+ "norm_eps": 1e-05,
42
+ "norm_topk_prob": true,
43
+ "num_attention_heads": 32,
44
+ "num_dense_layers": 2,
45
+ "num_experts": 32,
46
+ "num_experts_per_tok": 4,
47
+ "num_hidden_layers": 24,
48
+ "num_key_value_heads": 8,
49
+ "pad_token_id": 0,
50
+ "quantization_config": {
51
+ "config_groups": {
52
+ "group_0": {
53
+ "format": "pack-quantized",
54
+ "input_activations": null,
55
+ "output_activations": null,
56
+ "targets": [
57
+ "Linear"
58
+ ],
59
+ "weights": {
60
+ "actorder": null,
61
+ "block_structure": null,
62
+ "dynamic": false,
63
+ "group_size": 32,
64
+ "num_bits": 4,
65
+ "observer": "mse",
66
+ "observer_kwargs": {},
67
+ "strategy": "group",
68
+ "symmetric": true,
69
+ "type": "int"
70
+ }
71
+ }
72
+ },
73
+ "format": "pack-quantized",
74
+ "global_compression_ratio": null,
75
+ "ignore": [
76
+ "model.layers.0.conv.in_proj",
77
+ "model.layers.0.conv.out_proj",
78
+ "model.layers.0.feed_forward.w1",
79
+ "model.layers.0.feed_forward.w3",
80
+ "model.layers.0.feed_forward.w2",
81
+ "model.layers.1.conv.in_proj",
82
+ "model.layers.1.conv.out_proj",
83
+ "model.layers.1.feed_forward.w1",
84
+ "model.layers.1.feed_forward.w3",
85
+ "model.layers.1.feed_forward.w2",
86
+ "model.layers.2.self_attn.q_proj",
87
+ "model.layers.2.self_attn.k_proj",
88
+ "model.layers.2.self_attn.v_proj",
89
+ "model.layers.2.self_attn.out_proj",
90
+ "model.layers.2.feed_forward.gate",
91
+ "model.layers.3.conv.in_proj",
92
+ "model.layers.3.conv.out_proj",
93
+ "model.layers.3.feed_forward.gate",
94
+ "model.layers.4.conv.in_proj",
95
+ "model.layers.4.conv.out_proj",
96
+ "model.layers.4.feed_forward.gate",
97
+ "model.layers.5.conv.in_proj",
98
+ "model.layers.5.conv.out_proj",
99
+ "model.layers.5.feed_forward.gate",
100
+ "model.layers.6.self_attn.q_proj",
101
+ "model.layers.6.self_attn.k_proj",
102
+ "model.layers.6.self_attn.v_proj",
103
+ "model.layers.6.self_attn.out_proj",
104
+ "model.layers.6.feed_forward.gate",
105
+ "model.layers.7.conv.in_proj",
106
+ "model.layers.7.conv.out_proj",
107
+ "model.layers.7.feed_forward.gate",
108
+ "model.layers.8.conv.in_proj",
109
+ "model.layers.8.conv.out_proj",
110
+ "model.layers.8.feed_forward.gate",
111
+ "model.layers.9.conv.in_proj",
112
+ "model.layers.9.conv.out_proj",
113
+ "model.layers.9.feed_forward.gate",
114
+ "model.layers.10.self_attn.q_proj",
115
+ "model.layers.10.self_attn.k_proj",
116
+ "model.layers.10.self_attn.v_proj",
117
+ "model.layers.10.self_attn.out_proj",
118
+ "model.layers.10.feed_forward.gate",
119
+ "model.layers.11.conv.in_proj",
120
+ "model.layers.11.conv.out_proj",
121
+ "model.layers.11.feed_forward.gate",
122
+ "model.layers.12.conv.in_proj",
123
+ "model.layers.12.conv.out_proj",
124
+ "model.layers.12.feed_forward.gate",
125
+ "model.layers.13.conv.in_proj",
126
+ "model.layers.13.conv.out_proj",
127
+ "model.layers.13.feed_forward.gate",
128
+ "model.layers.14.self_attn.q_proj",
129
+ "model.layers.14.self_attn.k_proj",
130
+ "model.layers.14.self_attn.v_proj",
131
+ "model.layers.14.self_attn.out_proj",
132
+ "model.layers.14.feed_forward.gate",
133
+ "model.layers.15.conv.in_proj",
134
+ "model.layers.15.conv.out_proj",
135
+ "model.layers.15.feed_forward.gate",
136
+ "model.layers.16.conv.in_proj",
137
+ "model.layers.16.conv.out_proj",
138
+ "model.layers.16.feed_forward.gate",
139
+ "model.layers.17.conv.in_proj",
140
+ "model.layers.17.conv.out_proj",
141
+ "model.layers.17.feed_forward.gate",
142
+ "model.layers.18.self_attn.q_proj",
143
+ "model.layers.18.self_attn.k_proj",
144
+ "model.layers.18.self_attn.v_proj",
145
+ "model.layers.18.self_attn.out_proj",
146
+ "model.layers.18.feed_forward.gate",
147
+ "model.layers.19.conv.in_proj",
148
+ "model.layers.19.conv.out_proj",
149
+ "model.layers.19.feed_forward.gate",
150
+ "model.layers.20.conv.in_proj",
151
+ "model.layers.20.conv.out_proj",
152
+ "model.layers.20.feed_forward.gate",
153
+ "model.layers.21.self_attn.q_proj",
154
+ "model.layers.21.self_attn.k_proj",
155
+ "model.layers.21.self_attn.v_proj",
156
+ "model.layers.21.self_attn.out_proj",
157
+ "model.layers.21.feed_forward.gate",
158
+ "model.layers.22.conv.in_proj",
159
+ "model.layers.22.conv.out_proj",
160
+ "model.layers.22.feed_forward.gate",
161
+ "model.layers.23.conv.in_proj",
162
+ "model.layers.23.conv.out_proj",
163
+ "model.layers.23.feed_forward.gate",
164
+ "lm_head"
165
+ ],
166
+ "kv_cache_scheme": null,
167
+ "quant_method": "compressed-tensors",
168
+ "quantization_status": "compressed",
169
+ "sparsity_config": {},
170
+ "transform_config": {},
171
+ "version": "0.12.1.dev0"
172
+ },
173
+ "rope_theta": 1000000.0,
174
+ "routed_scaling_factor": 1.0,
175
+ "tie_word_embeddings": false,
176
+ "transformers_version": "5.0.0.dev0",
177
+ "use_cache": true,
178
+ "use_expert_bias": true,
179
+ "vocab_size": 65536
180
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 7,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "5.0.0.dev0"
7
+ }
model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1bc26a92ce848d114389fc9897a79dd7c4ad51fa6d415bd051faa84ff234943
3
+ size 5000348672
model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08ede6d74b6906669a5bf9d0c6531eaf6a140d659ed324cf06741e2b78d3b0e1
3
+ size 806629832
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
recipe.yaml ADDED
@@ -0,0 +1,834 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ default_stage:
2
+ default_modifiers:
3
+ AWQModifier:
4
+ config_groups:
5
+ group_0:
6
+ targets: [Linear]
7
+ weights:
8
+ num_bits: 4
9
+ type: int
10
+ symmetric: true
11
+ group_size: 32
12
+ strategy: group
13
+ block_structure: null
14
+ dynamic: false
15
+ actorder: null
16
+ observer: mse
17
+ observer_kwargs: {}
18
+ input_activations: null
19
+ output_activations: null
20
+ format: null
21
+ targets: [Linear]
22
+ ignore: [model.embed_tokens, model.embedding_norm, 're:model[.]layers[.]0[.].*', 're:model[.]layers[.]1[.].*',
23
+ 're:.*feed_forward[.]gate$', 're:.*ffn_norm$', 're:.*operator_norm$', 're:.*self_attn.*',
24
+ 're:.*conv.*', lm_head]
25
+ mappings:
26
+ - smooth_layer: model.layers.0.operator_norm
27
+ balance_layers: [model.layers.0.conv.in_proj]
28
+ - smooth_layer: model.layers.0.ffn_norm
29
+ balance_layers: [model.layers.0.feed_forward.w1, model.layers.0.feed_forward.w3]
30
+ - smooth_layer: model.layers.1.operator_norm
31
+ balance_layers: [model.layers.1.conv.in_proj]
32
+ - smooth_layer: model.layers.1.ffn_norm
33
+ balance_layers: [model.layers.1.feed_forward.w1, model.layers.1.feed_forward.w3]
34
+ - smooth_layer: model.layers.2.operator_norm
35
+ balance_layers: [model.layers.2.self_attn.q_proj, model.layers.2.self_attn.k_proj,
36
+ model.layers.2.self_attn.v_proj]
37
+ - smooth_layer: model.layers.2.ffn_norm
38
+ balance_layers: [model.layers.2.feed_forward.gate, model.layers.2.feed_forward.experts.0.w1,
39
+ model.layers.2.feed_forward.experts.0.w3, model.layers.2.feed_forward.experts.1.w1,
40
+ model.layers.2.feed_forward.experts.1.w3, model.layers.2.feed_forward.experts.2.w1,
41
+ model.layers.2.feed_forward.experts.2.w3, model.layers.2.feed_forward.experts.3.w1,
42
+ model.layers.2.feed_forward.experts.3.w3, model.layers.2.feed_forward.experts.4.w1,
43
+ model.layers.2.feed_forward.experts.4.w3, model.layers.2.feed_forward.experts.5.w1,
44
+ model.layers.2.feed_forward.experts.5.w3, model.layers.2.feed_forward.experts.6.w1,
45
+ model.layers.2.feed_forward.experts.6.w3, model.layers.2.feed_forward.experts.7.w1,
46
+ model.layers.2.feed_forward.experts.7.w3, model.layers.2.feed_forward.experts.8.w1,
47
+ model.layers.2.feed_forward.experts.8.w3, model.layers.2.feed_forward.experts.9.w1,
48
+ model.layers.2.feed_forward.experts.9.w3, model.layers.2.feed_forward.experts.10.w1,
49
+ model.layers.2.feed_forward.experts.10.w3, model.layers.2.feed_forward.experts.11.w1,
50
+ model.layers.2.feed_forward.experts.11.w3, model.layers.2.feed_forward.experts.12.w1,
51
+ model.layers.2.feed_forward.experts.12.w3, model.layers.2.feed_forward.experts.13.w1,
52
+ model.layers.2.feed_forward.experts.13.w3, model.layers.2.feed_forward.experts.14.w1,
53
+ model.layers.2.feed_forward.experts.14.w3, model.layers.2.feed_forward.experts.15.w1,
54
+ model.layers.2.feed_forward.experts.15.w3, model.layers.2.feed_forward.experts.16.w1,
55
+ model.layers.2.feed_forward.experts.16.w3, model.layers.2.feed_forward.experts.17.w1,
56
+ model.layers.2.feed_forward.experts.17.w3, model.layers.2.feed_forward.experts.18.w1,
57
+ model.layers.2.feed_forward.experts.18.w3, model.layers.2.feed_forward.experts.19.w1,
58
+ model.layers.2.feed_forward.experts.19.w3, model.layers.2.feed_forward.experts.20.w1,
59
+ model.layers.2.feed_forward.experts.20.w3, model.layers.2.feed_forward.experts.21.w1,
60
+ model.layers.2.feed_forward.experts.21.w3, model.layers.2.feed_forward.experts.22.w1,
61
+ model.layers.2.feed_forward.experts.22.w3, model.layers.2.feed_forward.experts.23.w1,
62
+ model.layers.2.feed_forward.experts.23.w3, model.layers.2.feed_forward.experts.24.w1,
63
+ model.layers.2.feed_forward.experts.24.w3, model.layers.2.feed_forward.experts.25.w1,
64
+ model.layers.2.feed_forward.experts.25.w3, model.layers.2.feed_forward.experts.26.w1,
65
+ model.layers.2.feed_forward.experts.26.w3, model.layers.2.feed_forward.experts.27.w1,
66
+ model.layers.2.feed_forward.experts.27.w3, model.layers.2.feed_forward.experts.28.w1,
67
+ model.layers.2.feed_forward.experts.28.w3, model.layers.2.feed_forward.experts.29.w1,
68
+ model.layers.2.feed_forward.experts.29.w3, model.layers.2.feed_forward.experts.30.w1,
69
+ model.layers.2.feed_forward.experts.30.w3, model.layers.2.feed_forward.experts.31.w1,
70
+ model.layers.2.feed_forward.experts.31.w3]
71
+ - smooth_layer: model.layers.3.operator_norm
72
+ balance_layers: [model.layers.3.conv.in_proj]
73
+ - smooth_layer: model.layers.3.ffn_norm
74
+ balance_layers: [model.layers.3.feed_forward.gate, model.layers.3.feed_forward.experts.0.w1,
75
+ model.layers.3.feed_forward.experts.0.w3, model.layers.3.feed_forward.experts.1.w1,
76
+ model.layers.3.feed_forward.experts.1.w3, model.layers.3.feed_forward.experts.2.w1,
77
+ model.layers.3.feed_forward.experts.2.w3, model.layers.3.feed_forward.experts.3.w1,
78
+ model.layers.3.feed_forward.experts.3.w3, model.layers.3.feed_forward.experts.4.w1,
79
+ model.layers.3.feed_forward.experts.4.w3, model.layers.3.feed_forward.experts.5.w1,
80
+ model.layers.3.feed_forward.experts.5.w3, model.layers.3.feed_forward.experts.6.w1,
81
+ model.layers.3.feed_forward.experts.6.w3, model.layers.3.feed_forward.experts.7.w1,
82
+ model.layers.3.feed_forward.experts.7.w3, model.layers.3.feed_forward.experts.8.w1,
83
+ model.layers.3.feed_forward.experts.8.w3, model.layers.3.feed_forward.experts.9.w1,
84
+ model.layers.3.feed_forward.experts.9.w3, model.layers.3.feed_forward.experts.10.w1,
85
+ model.layers.3.feed_forward.experts.10.w3, model.layers.3.feed_forward.experts.11.w1,
86
+ model.layers.3.feed_forward.experts.11.w3, model.layers.3.feed_forward.experts.12.w1,
87
+ model.layers.3.feed_forward.experts.12.w3, model.layers.3.feed_forward.experts.13.w1,
88
+ model.layers.3.feed_forward.experts.13.w3, model.layers.3.feed_forward.experts.14.w1,
89
+ model.layers.3.feed_forward.experts.14.w3, model.layers.3.feed_forward.experts.15.w1,
90
+ model.layers.3.feed_forward.experts.15.w3, model.layers.3.feed_forward.experts.16.w1,
91
+ model.layers.3.feed_forward.experts.16.w3, model.layers.3.feed_forward.experts.17.w1,
92
+ model.layers.3.feed_forward.experts.17.w3, model.layers.3.feed_forward.experts.18.w1,
93
+ model.layers.3.feed_forward.experts.18.w3, model.layers.3.feed_forward.experts.19.w1,
94
+ model.layers.3.feed_forward.experts.19.w3, model.layers.3.feed_forward.experts.20.w1,
95
+ model.layers.3.feed_forward.experts.20.w3, model.layers.3.feed_forward.experts.21.w1,
96
+ model.layers.3.feed_forward.experts.21.w3, model.layers.3.feed_forward.experts.22.w1,
97
+ model.layers.3.feed_forward.experts.22.w3, model.layers.3.feed_forward.experts.23.w1,
98
+ model.layers.3.feed_forward.experts.23.w3, model.layers.3.feed_forward.experts.24.w1,
99
+ model.layers.3.feed_forward.experts.24.w3, model.layers.3.feed_forward.experts.25.w1,
100
+ model.layers.3.feed_forward.experts.25.w3, model.layers.3.feed_forward.experts.26.w1,
101
+ model.layers.3.feed_forward.experts.26.w3, model.layers.3.feed_forward.experts.27.w1,
102
+ model.layers.3.feed_forward.experts.27.w3, model.layers.3.feed_forward.experts.28.w1,
103
+ model.layers.3.feed_forward.experts.28.w3, model.layers.3.feed_forward.experts.29.w1,
104
+ model.layers.3.feed_forward.experts.29.w3, model.layers.3.feed_forward.experts.30.w1,
105
+ model.layers.3.feed_forward.experts.30.w3, model.layers.3.feed_forward.experts.31.w1,
106
+ model.layers.3.feed_forward.experts.31.w3]
107
+ - smooth_layer: model.layers.4.operator_norm
108
+ balance_layers: [model.layers.4.conv.in_proj]
109
+ - smooth_layer: model.layers.4.ffn_norm
110
+ balance_layers: [model.layers.4.feed_forward.gate, model.layers.4.feed_forward.experts.0.w1,
111
+ model.layers.4.feed_forward.experts.0.w3, model.layers.4.feed_forward.experts.1.w1,
112
+ model.layers.4.feed_forward.experts.1.w3, model.layers.4.feed_forward.experts.2.w1,
113
+ model.layers.4.feed_forward.experts.2.w3, model.layers.4.feed_forward.experts.3.w1,
114
+ model.layers.4.feed_forward.experts.3.w3, model.layers.4.feed_forward.experts.4.w1,
115
+ model.layers.4.feed_forward.experts.4.w3, model.layers.4.feed_forward.experts.5.w1,
116
+ model.layers.4.feed_forward.experts.5.w3, model.layers.4.feed_forward.experts.6.w1,
117
+ model.layers.4.feed_forward.experts.6.w3, model.layers.4.feed_forward.experts.7.w1,
118
+ model.layers.4.feed_forward.experts.7.w3, model.layers.4.feed_forward.experts.8.w1,
119
+ model.layers.4.feed_forward.experts.8.w3, model.layers.4.feed_forward.experts.9.w1,
120
+ model.layers.4.feed_forward.experts.9.w3, model.layers.4.feed_forward.experts.10.w1,
121
+ model.layers.4.feed_forward.experts.10.w3, model.layers.4.feed_forward.experts.11.w1,
122
+ model.layers.4.feed_forward.experts.11.w3, model.layers.4.feed_forward.experts.12.w1,
123
+ model.layers.4.feed_forward.experts.12.w3, model.layers.4.feed_forward.experts.13.w1,
124
+ model.layers.4.feed_forward.experts.13.w3, model.layers.4.feed_forward.experts.14.w1,
125
+ model.layers.4.feed_forward.experts.14.w3, model.layers.4.feed_forward.experts.15.w1,
126
+ model.layers.4.feed_forward.experts.15.w3, model.layers.4.feed_forward.experts.16.w1,
127
+ model.layers.4.feed_forward.experts.16.w3, model.layers.4.feed_forward.experts.17.w1,
128
+ model.layers.4.feed_forward.experts.17.w3, model.layers.4.feed_forward.experts.18.w1,
129
+ model.layers.4.feed_forward.experts.18.w3, model.layers.4.feed_forward.experts.19.w1,
130
+ model.layers.4.feed_forward.experts.19.w3, model.layers.4.feed_forward.experts.20.w1,
131
+ model.layers.4.feed_forward.experts.20.w3, model.layers.4.feed_forward.experts.21.w1,
132
+ model.layers.4.feed_forward.experts.21.w3, model.layers.4.feed_forward.experts.22.w1,
133
+ model.layers.4.feed_forward.experts.22.w3, model.layers.4.feed_forward.experts.23.w1,
134
+ model.layers.4.feed_forward.experts.23.w3, model.layers.4.feed_forward.experts.24.w1,
135
+ model.layers.4.feed_forward.experts.24.w3, model.layers.4.feed_forward.experts.25.w1,
136
+ model.layers.4.feed_forward.experts.25.w3, model.layers.4.feed_forward.experts.26.w1,
137
+ model.layers.4.feed_forward.experts.26.w3, model.layers.4.feed_forward.experts.27.w1,
138
+ model.layers.4.feed_forward.experts.27.w3, model.layers.4.feed_forward.experts.28.w1,
139
+ model.layers.4.feed_forward.experts.28.w3, model.layers.4.feed_forward.experts.29.w1,
140
+ model.layers.4.feed_forward.experts.29.w3, model.layers.4.feed_forward.experts.30.w1,
141
+ model.layers.4.feed_forward.experts.30.w3, model.layers.4.feed_forward.experts.31.w1,
142
+ model.layers.4.feed_forward.experts.31.w3]
143
+ - smooth_layer: model.layers.5.operator_norm
144
+ balance_layers: [model.layers.5.conv.in_proj]
145
+ - smooth_layer: model.layers.5.ffn_norm
146
+ balance_layers: [model.layers.5.feed_forward.gate, model.layers.5.feed_forward.experts.0.w1,
147
+ model.layers.5.feed_forward.experts.0.w3, model.layers.5.feed_forward.experts.1.w1,
148
+ model.layers.5.feed_forward.experts.1.w3, model.layers.5.feed_forward.experts.2.w1,
149
+ model.layers.5.feed_forward.experts.2.w3, model.layers.5.feed_forward.experts.3.w1,
150
+ model.layers.5.feed_forward.experts.3.w3, model.layers.5.feed_forward.experts.4.w1,
151
+ model.layers.5.feed_forward.experts.4.w3, model.layers.5.feed_forward.experts.5.w1,
152
+ model.layers.5.feed_forward.experts.5.w3, model.layers.5.feed_forward.experts.6.w1,
153
+ model.layers.5.feed_forward.experts.6.w3, model.layers.5.feed_forward.experts.7.w1,
154
+ model.layers.5.feed_forward.experts.7.w3, model.layers.5.feed_forward.experts.8.w1,
155
+ model.layers.5.feed_forward.experts.8.w3, model.layers.5.feed_forward.experts.9.w1,
156
+ model.layers.5.feed_forward.experts.9.w3, model.layers.5.feed_forward.experts.10.w1,
157
+ model.layers.5.feed_forward.experts.10.w3, model.layers.5.feed_forward.experts.11.w1,
158
+ model.layers.5.feed_forward.experts.11.w3, model.layers.5.feed_forward.experts.12.w1,
159
+ model.layers.5.feed_forward.experts.12.w3, model.layers.5.feed_forward.experts.13.w1,
160
+ model.layers.5.feed_forward.experts.13.w3, model.layers.5.feed_forward.experts.14.w1,
161
+ model.layers.5.feed_forward.experts.14.w3, model.layers.5.feed_forward.experts.15.w1,
162
+ model.layers.5.feed_forward.experts.15.w3, model.layers.5.feed_forward.experts.16.w1,
163
+ model.layers.5.feed_forward.experts.16.w3, model.layers.5.feed_forward.experts.17.w1,
164
+ model.layers.5.feed_forward.experts.17.w3, model.layers.5.feed_forward.experts.18.w1,
165
+ model.layers.5.feed_forward.experts.18.w3, model.layers.5.feed_forward.experts.19.w1,
166
+ model.layers.5.feed_forward.experts.19.w3, model.layers.5.feed_forward.experts.20.w1,
167
+ model.layers.5.feed_forward.experts.20.w3, model.layers.5.feed_forward.experts.21.w1,
168
+ model.layers.5.feed_forward.experts.21.w3, model.layers.5.feed_forward.experts.22.w1,
169
+ model.layers.5.feed_forward.experts.22.w3, model.layers.5.feed_forward.experts.23.w1,
170
+ model.layers.5.feed_forward.experts.23.w3, model.layers.5.feed_forward.experts.24.w1,
171
+ model.layers.5.feed_forward.experts.24.w3, model.layers.5.feed_forward.experts.25.w1,
172
+ model.layers.5.feed_forward.experts.25.w3, model.layers.5.feed_forward.experts.26.w1,
173
+ model.layers.5.feed_forward.experts.26.w3, model.layers.5.feed_forward.experts.27.w1,
174
+ model.layers.5.feed_forward.experts.27.w3, model.layers.5.feed_forward.experts.28.w1,
175
+ model.layers.5.feed_forward.experts.28.w3, model.layers.5.feed_forward.experts.29.w1,
176
+ model.layers.5.feed_forward.experts.29.w3, model.layers.5.feed_forward.experts.30.w1,
177
+ model.layers.5.feed_forward.experts.30.w3, model.layers.5.feed_forward.experts.31.w1,
178
+ model.layers.5.feed_forward.experts.31.w3]
179
+ - smooth_layer: model.layers.6.operator_norm
180
+ balance_layers: [model.layers.6.self_attn.q_proj, model.layers.6.self_attn.k_proj,
181
+ model.layers.6.self_attn.v_proj]
182
+ - smooth_layer: model.layers.6.ffn_norm
183
+ balance_layers: [model.layers.6.feed_forward.gate, model.layers.6.feed_forward.experts.0.w1,
184
+ model.layers.6.feed_forward.experts.0.w3, model.layers.6.feed_forward.experts.1.w1,
185
+ model.layers.6.feed_forward.experts.1.w3, model.layers.6.feed_forward.experts.2.w1,
186
+ model.layers.6.feed_forward.experts.2.w3, model.layers.6.feed_forward.experts.3.w1,
187
+ model.layers.6.feed_forward.experts.3.w3, model.layers.6.feed_forward.experts.4.w1,
188
+ model.layers.6.feed_forward.experts.4.w3, model.layers.6.feed_forward.experts.5.w1,
189
+ model.layers.6.feed_forward.experts.5.w3, model.layers.6.feed_forward.experts.6.w1,
190
+ model.layers.6.feed_forward.experts.6.w3, model.layers.6.feed_forward.experts.7.w1,
191
+ model.layers.6.feed_forward.experts.7.w3, model.layers.6.feed_forward.experts.8.w1,
192
+ model.layers.6.feed_forward.experts.8.w3, model.layers.6.feed_forward.experts.9.w1,
193
+ model.layers.6.feed_forward.experts.9.w3, model.layers.6.feed_forward.experts.10.w1,
194
+ model.layers.6.feed_forward.experts.10.w3, model.layers.6.feed_forward.experts.11.w1,
195
+ model.layers.6.feed_forward.experts.11.w3, model.layers.6.feed_forward.experts.12.w1,
196
+ model.layers.6.feed_forward.experts.12.w3, model.layers.6.feed_forward.experts.13.w1,
197
+ model.layers.6.feed_forward.experts.13.w3, model.layers.6.feed_forward.experts.14.w1,
198
+ model.layers.6.feed_forward.experts.14.w3, model.layers.6.feed_forward.experts.15.w1,
199
+ model.layers.6.feed_forward.experts.15.w3, model.layers.6.feed_forward.experts.16.w1,
200
+ model.layers.6.feed_forward.experts.16.w3, model.layers.6.feed_forward.experts.17.w1,
201
+ model.layers.6.feed_forward.experts.17.w3, model.layers.6.feed_forward.experts.18.w1,
202
+ model.layers.6.feed_forward.experts.18.w3, model.layers.6.feed_forward.experts.19.w1,
203
+ model.layers.6.feed_forward.experts.19.w3, model.layers.6.feed_forward.experts.20.w1,
204
+ model.layers.6.feed_forward.experts.20.w3, model.layers.6.feed_forward.experts.21.w1,
205
+ model.layers.6.feed_forward.experts.21.w3, model.layers.6.feed_forward.experts.22.w1,
206
+ model.layers.6.feed_forward.experts.22.w3, model.layers.6.feed_forward.experts.23.w1,
207
+ model.layers.6.feed_forward.experts.23.w3, model.layers.6.feed_forward.experts.24.w1,
208
+ model.layers.6.feed_forward.experts.24.w3, model.layers.6.feed_forward.experts.25.w1,
209
+ model.layers.6.feed_forward.experts.25.w3, model.layers.6.feed_forward.experts.26.w1,
210
+ model.layers.6.feed_forward.experts.26.w3, model.layers.6.feed_forward.experts.27.w1,
211
+ model.layers.6.feed_forward.experts.27.w3, model.layers.6.feed_forward.experts.28.w1,
212
+ model.layers.6.feed_forward.experts.28.w3, model.layers.6.feed_forward.experts.29.w1,
213
+ model.layers.6.feed_forward.experts.29.w3, model.layers.6.feed_forward.experts.30.w1,
214
+ model.layers.6.feed_forward.experts.30.w3, model.layers.6.feed_forward.experts.31.w1,
215
+ model.layers.6.feed_forward.experts.31.w3]
216
+ - smooth_layer: model.layers.7.operator_norm
217
+ balance_layers: [model.layers.7.conv.in_proj]
218
+ - smooth_layer: model.layers.7.ffn_norm
219
+ balance_layers: [model.layers.7.feed_forward.gate, model.layers.7.feed_forward.experts.0.w1,
220
+ model.layers.7.feed_forward.experts.0.w3, model.layers.7.feed_forward.experts.1.w1,
221
+ model.layers.7.feed_forward.experts.1.w3, model.layers.7.feed_forward.experts.2.w1,
222
+ model.layers.7.feed_forward.experts.2.w3, model.layers.7.feed_forward.experts.3.w1,
223
+ model.layers.7.feed_forward.experts.3.w3, model.layers.7.feed_forward.experts.4.w1,
224
+ model.layers.7.feed_forward.experts.4.w3, model.layers.7.feed_forward.experts.5.w1,
225
+ model.layers.7.feed_forward.experts.5.w3, model.layers.7.feed_forward.experts.6.w1,
226
+ model.layers.7.feed_forward.experts.6.w3, model.layers.7.feed_forward.experts.7.w1,
227
+ model.layers.7.feed_forward.experts.7.w3, model.layers.7.feed_forward.experts.8.w1,
228
+ model.layers.7.feed_forward.experts.8.w3, model.layers.7.feed_forward.experts.9.w1,
229
+ model.layers.7.feed_forward.experts.9.w3, model.layers.7.feed_forward.experts.10.w1,
230
+ model.layers.7.feed_forward.experts.10.w3, model.layers.7.feed_forward.experts.11.w1,
231
+ model.layers.7.feed_forward.experts.11.w3, model.layers.7.feed_forward.experts.12.w1,
232
+ model.layers.7.feed_forward.experts.12.w3, model.layers.7.feed_forward.experts.13.w1,
233
+ model.layers.7.feed_forward.experts.13.w3, model.layers.7.feed_forward.experts.14.w1,
234
+ model.layers.7.feed_forward.experts.14.w3, model.layers.7.feed_forward.experts.15.w1,
235
+ model.layers.7.feed_forward.experts.15.w3, model.layers.7.feed_forward.experts.16.w1,
236
+ model.layers.7.feed_forward.experts.16.w3, model.layers.7.feed_forward.experts.17.w1,
237
+ model.layers.7.feed_forward.experts.17.w3, model.layers.7.feed_forward.experts.18.w1,
238
+ model.layers.7.feed_forward.experts.18.w3, model.layers.7.feed_forward.experts.19.w1,
239
+ model.layers.7.feed_forward.experts.19.w3, model.layers.7.feed_forward.experts.20.w1,
240
+ model.layers.7.feed_forward.experts.20.w3, model.layers.7.feed_forward.experts.21.w1,
241
+ model.layers.7.feed_forward.experts.21.w3, model.layers.7.feed_forward.experts.22.w1,
242
+ model.layers.7.feed_forward.experts.22.w3, model.layers.7.feed_forward.experts.23.w1,
243
+ model.layers.7.feed_forward.experts.23.w3, model.layers.7.feed_forward.experts.24.w1,
244
+ model.layers.7.feed_forward.experts.24.w3, model.layers.7.feed_forward.experts.25.w1,
245
+ model.layers.7.feed_forward.experts.25.w3, model.layers.7.feed_forward.experts.26.w1,
246
+ model.layers.7.feed_forward.experts.26.w3, model.layers.7.feed_forward.experts.27.w1,
247
+ model.layers.7.feed_forward.experts.27.w3, model.layers.7.feed_forward.experts.28.w1,
248
+ model.layers.7.feed_forward.experts.28.w3, model.layers.7.feed_forward.experts.29.w1,
249
+ model.layers.7.feed_forward.experts.29.w3, model.layers.7.feed_forward.experts.30.w1,
250
+ model.layers.7.feed_forward.experts.30.w3, model.layers.7.feed_forward.experts.31.w1,
251
+ model.layers.7.feed_forward.experts.31.w3]
252
+ - smooth_layer: model.layers.8.operator_norm
253
+ balance_layers: [model.layers.8.conv.in_proj]
254
+ - smooth_layer: model.layers.8.ffn_norm
255
+ balance_layers: [model.layers.8.feed_forward.gate, model.layers.8.feed_forward.experts.0.w1,
256
+ model.layers.8.feed_forward.experts.0.w3, model.layers.8.feed_forward.experts.1.w1,
257
+ model.layers.8.feed_forward.experts.1.w3, model.layers.8.feed_forward.experts.2.w1,
258
+ model.layers.8.feed_forward.experts.2.w3, model.layers.8.feed_forward.experts.3.w1,
259
+ model.layers.8.feed_forward.experts.3.w3, model.layers.8.feed_forward.experts.4.w1,
260
+ model.layers.8.feed_forward.experts.4.w3, model.layers.8.feed_forward.experts.5.w1,
261
+ model.layers.8.feed_forward.experts.5.w3, model.layers.8.feed_forward.experts.6.w1,
262
+ model.layers.8.feed_forward.experts.6.w3, model.layers.8.feed_forward.experts.7.w1,
263
+ model.layers.8.feed_forward.experts.7.w3, model.layers.8.feed_forward.experts.8.w1,
264
+ model.layers.8.feed_forward.experts.8.w3, model.layers.8.feed_forward.experts.9.w1,
265
+ model.layers.8.feed_forward.experts.9.w3, model.layers.8.feed_forward.experts.10.w1,
266
+ model.layers.8.feed_forward.experts.10.w3, model.layers.8.feed_forward.experts.11.w1,
267
+ model.layers.8.feed_forward.experts.11.w3, model.layers.8.feed_forward.experts.12.w1,
268
+ model.layers.8.feed_forward.experts.12.w3, model.layers.8.feed_forward.experts.13.w1,
269
+ model.layers.8.feed_forward.experts.13.w3, model.layers.8.feed_forward.experts.14.w1,
270
+ model.layers.8.feed_forward.experts.14.w3, model.layers.8.feed_forward.experts.15.w1,
271
+ model.layers.8.feed_forward.experts.15.w3, model.layers.8.feed_forward.experts.16.w1,
272
+ model.layers.8.feed_forward.experts.16.w3, model.layers.8.feed_forward.experts.17.w1,
273
+ model.layers.8.feed_forward.experts.17.w3, model.layers.8.feed_forward.experts.18.w1,
274
+ model.layers.8.feed_forward.experts.18.w3, model.layers.8.feed_forward.experts.19.w1,
275
+ model.layers.8.feed_forward.experts.19.w3, model.layers.8.feed_forward.experts.20.w1,
276
+ model.layers.8.feed_forward.experts.20.w3, model.layers.8.feed_forward.experts.21.w1,
277
+ model.layers.8.feed_forward.experts.21.w3, model.layers.8.feed_forward.experts.22.w1,
278
+ model.layers.8.feed_forward.experts.22.w3, model.layers.8.feed_forward.experts.23.w1,
279
+ model.layers.8.feed_forward.experts.23.w3, model.layers.8.feed_forward.experts.24.w1,
280
+ model.layers.8.feed_forward.experts.24.w3, model.layers.8.feed_forward.experts.25.w1,
281
+ model.layers.8.feed_forward.experts.25.w3, model.layers.8.feed_forward.experts.26.w1,
282
+ model.layers.8.feed_forward.experts.26.w3, model.layers.8.feed_forward.experts.27.w1,
283
+ model.layers.8.feed_forward.experts.27.w3, model.layers.8.feed_forward.experts.28.w1,
284
+ model.layers.8.feed_forward.experts.28.w3, model.layers.8.feed_forward.experts.29.w1,
285
+ model.layers.8.feed_forward.experts.29.w3, model.layers.8.feed_forward.experts.30.w1,
286
+ model.layers.8.feed_forward.experts.30.w3, model.layers.8.feed_forward.experts.31.w1,
287
+ model.layers.8.feed_forward.experts.31.w3]
288
+ - smooth_layer: model.layers.9.operator_norm
289
+ balance_layers: [model.layers.9.conv.in_proj]
290
+ - smooth_layer: model.layers.9.ffn_norm
291
+ balance_layers: [model.layers.9.feed_forward.gate, model.layers.9.feed_forward.experts.0.w1,
292
+ model.layers.9.feed_forward.experts.0.w3, model.layers.9.feed_forward.experts.1.w1,
293
+ model.layers.9.feed_forward.experts.1.w3, model.layers.9.feed_forward.experts.2.w1,
294
+ model.layers.9.feed_forward.experts.2.w3, model.layers.9.feed_forward.experts.3.w1,
295
+ model.layers.9.feed_forward.experts.3.w3, model.layers.9.feed_forward.experts.4.w1,
296
+ model.layers.9.feed_forward.experts.4.w3, model.layers.9.feed_forward.experts.5.w1,
297
+ model.layers.9.feed_forward.experts.5.w3, model.layers.9.feed_forward.experts.6.w1,
298
+ model.layers.9.feed_forward.experts.6.w3, model.layers.9.feed_forward.experts.7.w1,
299
+ model.layers.9.feed_forward.experts.7.w3, model.layers.9.feed_forward.experts.8.w1,
300
+ model.layers.9.feed_forward.experts.8.w3, model.layers.9.feed_forward.experts.9.w1,
301
+ model.layers.9.feed_forward.experts.9.w3, model.layers.9.feed_forward.experts.10.w1,
302
+ model.layers.9.feed_forward.experts.10.w3, model.layers.9.feed_forward.experts.11.w1,
303
+ model.layers.9.feed_forward.experts.11.w3, model.layers.9.feed_forward.experts.12.w1,
304
+ model.layers.9.feed_forward.experts.12.w3, model.layers.9.feed_forward.experts.13.w1,
305
+ model.layers.9.feed_forward.experts.13.w3, model.layers.9.feed_forward.experts.14.w1,
306
+ model.layers.9.feed_forward.experts.14.w3, model.layers.9.feed_forward.experts.15.w1,
307
+ model.layers.9.feed_forward.experts.15.w3, model.layers.9.feed_forward.experts.16.w1,
308
+ model.layers.9.feed_forward.experts.16.w3, model.layers.9.feed_forward.experts.17.w1,
309
+ model.layers.9.feed_forward.experts.17.w3, model.layers.9.feed_forward.experts.18.w1,
310
+ model.layers.9.feed_forward.experts.18.w3, model.layers.9.feed_forward.experts.19.w1,
311
+ model.layers.9.feed_forward.experts.19.w3, model.layers.9.feed_forward.experts.20.w1,
312
+ model.layers.9.feed_forward.experts.20.w3, model.layers.9.feed_forward.experts.21.w1,
313
+ model.layers.9.feed_forward.experts.21.w3, model.layers.9.feed_forward.experts.22.w1,
314
+ model.layers.9.feed_forward.experts.22.w3, model.layers.9.feed_forward.experts.23.w1,
315
+ model.layers.9.feed_forward.experts.23.w3, model.layers.9.feed_forward.experts.24.w1,
316
+ model.layers.9.feed_forward.experts.24.w3, model.layers.9.feed_forward.experts.25.w1,
317
+ model.layers.9.feed_forward.experts.25.w3, model.layers.9.feed_forward.experts.26.w1,
318
+ model.layers.9.feed_forward.experts.26.w3, model.layers.9.feed_forward.experts.27.w1,
319
+ model.layers.9.feed_forward.experts.27.w3, model.layers.9.feed_forward.experts.28.w1,
320
+ model.layers.9.feed_forward.experts.28.w3, model.layers.9.feed_forward.experts.29.w1,
321
+ model.layers.9.feed_forward.experts.29.w3, model.layers.9.feed_forward.experts.30.w1,
322
+ model.layers.9.feed_forward.experts.30.w3, model.layers.9.feed_forward.experts.31.w1,
323
+ model.layers.9.feed_forward.experts.31.w3]
324
+ - smooth_layer: model.layers.10.operator_norm
325
+ balance_layers: [model.layers.10.self_attn.q_proj, model.layers.10.self_attn.k_proj,
326
+ model.layers.10.self_attn.v_proj]
327
+ - smooth_layer: model.layers.10.ffn_norm
328
+ balance_layers: [model.layers.10.feed_forward.gate, model.layers.10.feed_forward.experts.0.w1,
329
+ model.layers.10.feed_forward.experts.0.w3, model.layers.10.feed_forward.experts.1.w1,
330
+ model.layers.10.feed_forward.experts.1.w3, model.layers.10.feed_forward.experts.2.w1,
331
+ model.layers.10.feed_forward.experts.2.w3, model.layers.10.feed_forward.experts.3.w1,
332
+ model.layers.10.feed_forward.experts.3.w3, model.layers.10.feed_forward.experts.4.w1,
333
+ model.layers.10.feed_forward.experts.4.w3, model.layers.10.feed_forward.experts.5.w1,
334
+ model.layers.10.feed_forward.experts.5.w3, model.layers.10.feed_forward.experts.6.w1,
335
+ model.layers.10.feed_forward.experts.6.w3, model.layers.10.feed_forward.experts.7.w1,
336
+ model.layers.10.feed_forward.experts.7.w3, model.layers.10.feed_forward.experts.8.w1,
337
+ model.layers.10.feed_forward.experts.8.w3, model.layers.10.feed_forward.experts.9.w1,
338
+ model.layers.10.feed_forward.experts.9.w3, model.layers.10.feed_forward.experts.10.w1,
339
+ model.layers.10.feed_forward.experts.10.w3, model.layers.10.feed_forward.experts.11.w1,
340
+ model.layers.10.feed_forward.experts.11.w3, model.layers.10.feed_forward.experts.12.w1,
341
+ model.layers.10.feed_forward.experts.12.w3, model.layers.10.feed_forward.experts.13.w1,
342
+ model.layers.10.feed_forward.experts.13.w3, model.layers.10.feed_forward.experts.14.w1,
343
+ model.layers.10.feed_forward.experts.14.w3, model.layers.10.feed_forward.experts.15.w1,
344
+ model.layers.10.feed_forward.experts.15.w3, model.layers.10.feed_forward.experts.16.w1,
345
+ model.layers.10.feed_forward.experts.16.w3, model.layers.10.feed_forward.experts.17.w1,
346
+ model.layers.10.feed_forward.experts.17.w3, model.layers.10.feed_forward.experts.18.w1,
347
+ model.layers.10.feed_forward.experts.18.w3, model.layers.10.feed_forward.experts.19.w1,
348
+ model.layers.10.feed_forward.experts.19.w3, model.layers.10.feed_forward.experts.20.w1,
349
+ model.layers.10.feed_forward.experts.20.w3, model.layers.10.feed_forward.experts.21.w1,
350
+ model.layers.10.feed_forward.experts.21.w3, model.layers.10.feed_forward.experts.22.w1,
351
+ model.layers.10.feed_forward.experts.22.w3, model.layers.10.feed_forward.experts.23.w1,
352
+ model.layers.10.feed_forward.experts.23.w3, model.layers.10.feed_forward.experts.24.w1,
353
+ model.layers.10.feed_forward.experts.24.w3, model.layers.10.feed_forward.experts.25.w1,
354
+ model.layers.10.feed_forward.experts.25.w3, model.layers.10.feed_forward.experts.26.w1,
355
+ model.layers.10.feed_forward.experts.26.w3, model.layers.10.feed_forward.experts.27.w1,
356
+ model.layers.10.feed_forward.experts.27.w3, model.layers.10.feed_forward.experts.28.w1,
357
+ model.layers.10.feed_forward.experts.28.w3, model.layers.10.feed_forward.experts.29.w1,
358
+ model.layers.10.feed_forward.experts.29.w3, model.layers.10.feed_forward.experts.30.w1,
359
+ model.layers.10.feed_forward.experts.30.w3, model.layers.10.feed_forward.experts.31.w1,
360
+ model.layers.10.feed_forward.experts.31.w3]
361
+ - smooth_layer: model.layers.11.operator_norm
362
+ balance_layers: [model.layers.11.conv.in_proj]
363
+ - smooth_layer: model.layers.11.ffn_norm
364
+ balance_layers: [model.layers.11.feed_forward.gate, model.layers.11.feed_forward.experts.0.w1,
365
+ model.layers.11.feed_forward.experts.0.w3, model.layers.11.feed_forward.experts.1.w1,
366
+ model.layers.11.feed_forward.experts.1.w3, model.layers.11.feed_forward.experts.2.w1,
367
+ model.layers.11.feed_forward.experts.2.w3, model.layers.11.feed_forward.experts.3.w1,
368
+ model.layers.11.feed_forward.experts.3.w3, model.layers.11.feed_forward.experts.4.w1,
369
+ model.layers.11.feed_forward.experts.4.w3, model.layers.11.feed_forward.experts.5.w1,
370
+ model.layers.11.feed_forward.experts.5.w3, model.layers.11.feed_forward.experts.6.w1,
371
+ model.layers.11.feed_forward.experts.6.w3, model.layers.11.feed_forward.experts.7.w1,
372
+ model.layers.11.feed_forward.experts.7.w3, model.layers.11.feed_forward.experts.8.w1,
373
+ model.layers.11.feed_forward.experts.8.w3, model.layers.11.feed_forward.experts.9.w1,
374
+ model.layers.11.feed_forward.experts.9.w3, model.layers.11.feed_forward.experts.10.w1,
375
+ model.layers.11.feed_forward.experts.10.w3, model.layers.11.feed_forward.experts.11.w1,
376
+ model.layers.11.feed_forward.experts.11.w3, model.layers.11.feed_forward.experts.12.w1,
377
+ model.layers.11.feed_forward.experts.12.w3, model.layers.11.feed_forward.experts.13.w1,
378
+ model.layers.11.feed_forward.experts.13.w3, model.layers.11.feed_forward.experts.14.w1,
379
+ model.layers.11.feed_forward.experts.14.w3, model.layers.11.feed_forward.experts.15.w1,
380
+ model.layers.11.feed_forward.experts.15.w3, model.layers.11.feed_forward.experts.16.w1,
381
+ model.layers.11.feed_forward.experts.16.w3, model.layers.11.feed_forward.experts.17.w1,
382
+ model.layers.11.feed_forward.experts.17.w3, model.layers.11.feed_forward.experts.18.w1,
383
+ model.layers.11.feed_forward.experts.18.w3, model.layers.11.feed_forward.experts.19.w1,
384
+ model.layers.11.feed_forward.experts.19.w3, model.layers.11.feed_forward.experts.20.w1,
385
+ model.layers.11.feed_forward.experts.20.w3, model.layers.11.feed_forward.experts.21.w1,
386
+ model.layers.11.feed_forward.experts.21.w3, model.layers.11.feed_forward.experts.22.w1,
387
+ model.layers.11.feed_forward.experts.22.w3, model.layers.11.feed_forward.experts.23.w1,
388
+ model.layers.11.feed_forward.experts.23.w3, model.layers.11.feed_forward.experts.24.w1,
389
+ model.layers.11.feed_forward.experts.24.w3, model.layers.11.feed_forward.experts.25.w1,
390
+ model.layers.11.feed_forward.experts.25.w3, model.layers.11.feed_forward.experts.26.w1,
391
+ model.layers.11.feed_forward.experts.26.w3, model.layers.11.feed_forward.experts.27.w1,
392
+ model.layers.11.feed_forward.experts.27.w3, model.layers.11.feed_forward.experts.28.w1,
393
+ model.layers.11.feed_forward.experts.28.w3, model.layers.11.feed_forward.experts.29.w1,
394
+ model.layers.11.feed_forward.experts.29.w3, model.layers.11.feed_forward.experts.30.w1,
395
+ model.layers.11.feed_forward.experts.30.w3, model.layers.11.feed_forward.experts.31.w1,
396
+ model.layers.11.feed_forward.experts.31.w3]
397
+ - smooth_layer: model.layers.12.operator_norm
398
+ balance_layers: [model.layers.12.conv.in_proj]
399
+ - smooth_layer: model.layers.12.ffn_norm
400
+ balance_layers: [model.layers.12.feed_forward.gate, model.layers.12.feed_forward.experts.0.w1,
401
+ model.layers.12.feed_forward.experts.0.w3, model.layers.12.feed_forward.experts.1.w1,
402
+ model.layers.12.feed_forward.experts.1.w3, model.layers.12.feed_forward.experts.2.w1,
403
+ model.layers.12.feed_forward.experts.2.w3, model.layers.12.feed_forward.experts.3.w1,
404
+ model.layers.12.feed_forward.experts.3.w3, model.layers.12.feed_forward.experts.4.w1,
405
+ model.layers.12.feed_forward.experts.4.w3, model.layers.12.feed_forward.experts.5.w1,
406
+ model.layers.12.feed_forward.experts.5.w3, model.layers.12.feed_forward.experts.6.w1,
407
+ model.layers.12.feed_forward.experts.6.w3, model.layers.12.feed_forward.experts.7.w1,
408
+ model.layers.12.feed_forward.experts.7.w3, model.layers.12.feed_forward.experts.8.w1,
409
+ model.layers.12.feed_forward.experts.8.w3, model.layers.12.feed_forward.experts.9.w1,
410
+ model.layers.12.feed_forward.experts.9.w3, model.layers.12.feed_forward.experts.10.w1,
411
+ model.layers.12.feed_forward.experts.10.w3, model.layers.12.feed_forward.experts.11.w1,
412
+ model.layers.12.feed_forward.experts.11.w3, model.layers.12.feed_forward.experts.12.w1,
413
+ model.layers.12.feed_forward.experts.12.w3, model.layers.12.feed_forward.experts.13.w1,
414
+ model.layers.12.feed_forward.experts.13.w3, model.layers.12.feed_forward.experts.14.w1,
415
+ model.layers.12.feed_forward.experts.14.w3, model.layers.12.feed_forward.experts.15.w1,
416
+ model.layers.12.feed_forward.experts.15.w3, model.layers.12.feed_forward.experts.16.w1,
417
+ model.layers.12.feed_forward.experts.16.w3, model.layers.12.feed_forward.experts.17.w1,
418
+ model.layers.12.feed_forward.experts.17.w3, model.layers.12.feed_forward.experts.18.w1,
419
+ model.layers.12.feed_forward.experts.18.w3, model.layers.12.feed_forward.experts.19.w1,
420
+ model.layers.12.feed_forward.experts.19.w3, model.layers.12.feed_forward.experts.20.w1,
421
+ model.layers.12.feed_forward.experts.20.w3, model.layers.12.feed_forward.experts.21.w1,
422
+ model.layers.12.feed_forward.experts.21.w3, model.layers.12.feed_forward.experts.22.w1,
423
+ model.layers.12.feed_forward.experts.22.w3, model.layers.12.feed_forward.experts.23.w1,
424
+ model.layers.12.feed_forward.experts.23.w3, model.layers.12.feed_forward.experts.24.w1,
425
+ model.layers.12.feed_forward.experts.24.w3, model.layers.12.feed_forward.experts.25.w1,
426
+ model.layers.12.feed_forward.experts.25.w3, model.layers.12.feed_forward.experts.26.w1,
427
+ model.layers.12.feed_forward.experts.26.w3, model.layers.12.feed_forward.experts.27.w1,
428
+ model.layers.12.feed_forward.experts.27.w3, model.layers.12.feed_forward.experts.28.w1,
429
+ model.layers.12.feed_forward.experts.28.w3, model.layers.12.feed_forward.experts.29.w1,
430
+ model.layers.12.feed_forward.experts.29.w3, model.layers.12.feed_forward.experts.30.w1,
431
+ model.layers.12.feed_forward.experts.30.w3, model.layers.12.feed_forward.experts.31.w1,
432
+ model.layers.12.feed_forward.experts.31.w3]
433
+ - smooth_layer: model.layers.13.operator_norm
434
+ balance_layers: [model.layers.13.conv.in_proj]
435
+ - smooth_layer: model.layers.13.ffn_norm
436
+ balance_layers: [model.layers.13.feed_forward.gate, model.layers.13.feed_forward.experts.0.w1,
437
+ model.layers.13.feed_forward.experts.0.w3, model.layers.13.feed_forward.experts.1.w1,
438
+ model.layers.13.feed_forward.experts.1.w3, model.layers.13.feed_forward.experts.2.w1,
439
+ model.layers.13.feed_forward.experts.2.w3, model.layers.13.feed_forward.experts.3.w1,
440
+ model.layers.13.feed_forward.experts.3.w3, model.layers.13.feed_forward.experts.4.w1,
441
+ model.layers.13.feed_forward.experts.4.w3, model.layers.13.feed_forward.experts.5.w1,
442
+ model.layers.13.feed_forward.experts.5.w3, model.layers.13.feed_forward.experts.6.w1,
443
+ model.layers.13.feed_forward.experts.6.w3, model.layers.13.feed_forward.experts.7.w1,
444
+ model.layers.13.feed_forward.experts.7.w3, model.layers.13.feed_forward.experts.8.w1,
445
+ model.layers.13.feed_forward.experts.8.w3, model.layers.13.feed_forward.experts.9.w1,
446
+ model.layers.13.feed_forward.experts.9.w3, model.layers.13.feed_forward.experts.10.w1,
447
+ model.layers.13.feed_forward.experts.10.w3, model.layers.13.feed_forward.experts.11.w1,
448
+ model.layers.13.feed_forward.experts.11.w3, model.layers.13.feed_forward.experts.12.w1,
449
+ model.layers.13.feed_forward.experts.12.w3, model.layers.13.feed_forward.experts.13.w1,
450
+ model.layers.13.feed_forward.experts.13.w3, model.layers.13.feed_forward.experts.14.w1,
451
+ model.layers.13.feed_forward.experts.14.w3, model.layers.13.feed_forward.experts.15.w1,
452
+ model.layers.13.feed_forward.experts.15.w3, model.layers.13.feed_forward.experts.16.w1,
453
+ model.layers.13.feed_forward.experts.16.w3, model.layers.13.feed_forward.experts.17.w1,
454
+ model.layers.13.feed_forward.experts.17.w3, model.layers.13.feed_forward.experts.18.w1,
455
+ model.layers.13.feed_forward.experts.18.w3, model.layers.13.feed_forward.experts.19.w1,
456
+ model.layers.13.feed_forward.experts.19.w3, model.layers.13.feed_forward.experts.20.w1,
457
+ model.layers.13.feed_forward.experts.20.w3, model.layers.13.feed_forward.experts.21.w1,
458
+ model.layers.13.feed_forward.experts.21.w3, model.layers.13.feed_forward.experts.22.w1,
459
+ model.layers.13.feed_forward.experts.22.w3, model.layers.13.feed_forward.experts.23.w1,
460
+ model.layers.13.feed_forward.experts.23.w3, model.layers.13.feed_forward.experts.24.w1,
461
+ model.layers.13.feed_forward.experts.24.w3, model.layers.13.feed_forward.experts.25.w1,
462
+ model.layers.13.feed_forward.experts.25.w3, model.layers.13.feed_forward.experts.26.w1,
463
+ model.layers.13.feed_forward.experts.26.w3, model.layers.13.feed_forward.experts.27.w1,
464
+ model.layers.13.feed_forward.experts.27.w3, model.layers.13.feed_forward.experts.28.w1,
465
+ model.layers.13.feed_forward.experts.28.w3, model.layers.13.feed_forward.experts.29.w1,
466
+ model.layers.13.feed_forward.experts.29.w3, model.layers.13.feed_forward.experts.30.w1,
467
+ model.layers.13.feed_forward.experts.30.w3, model.layers.13.feed_forward.experts.31.w1,
468
+ model.layers.13.feed_forward.experts.31.w3]
469
+ - smooth_layer: model.layers.14.operator_norm
470
+ balance_layers: [model.layers.14.self_attn.q_proj, model.layers.14.self_attn.k_proj,
471
+ model.layers.14.self_attn.v_proj]
472
+ - smooth_layer: model.layers.14.ffn_norm
473
+ balance_layers: [model.layers.14.feed_forward.gate, model.layers.14.feed_forward.experts.0.w1,
474
+ model.layers.14.feed_forward.experts.0.w3, model.layers.14.feed_forward.experts.1.w1,
475
+ model.layers.14.feed_forward.experts.1.w3, model.layers.14.feed_forward.experts.2.w1,
476
+ model.layers.14.feed_forward.experts.2.w3, model.layers.14.feed_forward.experts.3.w1,
477
+ model.layers.14.feed_forward.experts.3.w3, model.layers.14.feed_forward.experts.4.w1,
478
+ model.layers.14.feed_forward.experts.4.w3, model.layers.14.feed_forward.experts.5.w1,
479
+ model.layers.14.feed_forward.experts.5.w3, model.layers.14.feed_forward.experts.6.w1,
480
+ model.layers.14.feed_forward.experts.6.w3, model.layers.14.feed_forward.experts.7.w1,
481
+ model.layers.14.feed_forward.experts.7.w3, model.layers.14.feed_forward.experts.8.w1,
482
+ model.layers.14.feed_forward.experts.8.w3, model.layers.14.feed_forward.experts.9.w1,
483
+ model.layers.14.feed_forward.experts.9.w3, model.layers.14.feed_forward.experts.10.w1,
484
+ model.layers.14.feed_forward.experts.10.w3, model.layers.14.feed_forward.experts.11.w1,
485
+ model.layers.14.feed_forward.experts.11.w3, model.layers.14.feed_forward.experts.12.w1,
486
+ model.layers.14.feed_forward.experts.12.w3, model.layers.14.feed_forward.experts.13.w1,
487
+ model.layers.14.feed_forward.experts.13.w3, model.layers.14.feed_forward.experts.14.w1,
488
+ model.layers.14.feed_forward.experts.14.w3, model.layers.14.feed_forward.experts.15.w1,
489
+ model.layers.14.feed_forward.experts.15.w3, model.layers.14.feed_forward.experts.16.w1,
490
+ model.layers.14.feed_forward.experts.16.w3, model.layers.14.feed_forward.experts.17.w1,
491
+ model.layers.14.feed_forward.experts.17.w3, model.layers.14.feed_forward.experts.18.w1,
492
+ model.layers.14.feed_forward.experts.18.w3, model.layers.14.feed_forward.experts.19.w1,
493
+ model.layers.14.feed_forward.experts.19.w3, model.layers.14.feed_forward.experts.20.w1,
494
+ model.layers.14.feed_forward.experts.20.w3, model.layers.14.feed_forward.experts.21.w1,
495
+ model.layers.14.feed_forward.experts.21.w3, model.layers.14.feed_forward.experts.22.w1,
496
+ model.layers.14.feed_forward.experts.22.w3, model.layers.14.feed_forward.experts.23.w1,
497
+ model.layers.14.feed_forward.experts.23.w3, model.layers.14.feed_forward.experts.24.w1,
498
+ model.layers.14.feed_forward.experts.24.w3, model.layers.14.feed_forward.experts.25.w1,
499
+ model.layers.14.feed_forward.experts.25.w3, model.layers.14.feed_forward.experts.26.w1,
500
+ model.layers.14.feed_forward.experts.26.w3, model.layers.14.feed_forward.experts.27.w1,
501
+ model.layers.14.feed_forward.experts.27.w3, model.layers.14.feed_forward.experts.28.w1,
502
+ model.layers.14.feed_forward.experts.28.w3, model.layers.14.feed_forward.experts.29.w1,
503
+ model.layers.14.feed_forward.experts.29.w3, model.layers.14.feed_forward.experts.30.w1,
504
+ model.layers.14.feed_forward.experts.30.w3, model.layers.14.feed_forward.experts.31.w1,
505
+ model.layers.14.feed_forward.experts.31.w3]
506
+ - smooth_layer: model.layers.15.operator_norm
507
+ balance_layers: [model.layers.15.conv.in_proj]
508
+ - smooth_layer: model.layers.15.ffn_norm
509
+ balance_layers: [model.layers.15.feed_forward.gate, model.layers.15.feed_forward.experts.0.w1,
510
+ model.layers.15.feed_forward.experts.0.w3, model.layers.15.feed_forward.experts.1.w1,
511
+ model.layers.15.feed_forward.experts.1.w3, model.layers.15.feed_forward.experts.2.w1,
512
+ model.layers.15.feed_forward.experts.2.w3, model.layers.15.feed_forward.experts.3.w1,
513
+ model.layers.15.feed_forward.experts.3.w3, model.layers.15.feed_forward.experts.4.w1,
514
+ model.layers.15.feed_forward.experts.4.w3, model.layers.15.feed_forward.experts.5.w1,
515
+ model.layers.15.feed_forward.experts.5.w3, model.layers.15.feed_forward.experts.6.w1,
516
+ model.layers.15.feed_forward.experts.6.w3, model.layers.15.feed_forward.experts.7.w1,
517
+ model.layers.15.feed_forward.experts.7.w3, model.layers.15.feed_forward.experts.8.w1,
518
+ model.layers.15.feed_forward.experts.8.w3, model.layers.15.feed_forward.experts.9.w1,
519
+ model.layers.15.feed_forward.experts.9.w3, model.layers.15.feed_forward.experts.10.w1,
520
+ model.layers.15.feed_forward.experts.10.w3, model.layers.15.feed_forward.experts.11.w1,
521
+ model.layers.15.feed_forward.experts.11.w3, model.layers.15.feed_forward.experts.12.w1,
522
+ model.layers.15.feed_forward.experts.12.w3, model.layers.15.feed_forward.experts.13.w1,
523
+ model.layers.15.feed_forward.experts.13.w3, model.layers.15.feed_forward.experts.14.w1,
524
+ model.layers.15.feed_forward.experts.14.w3, model.layers.15.feed_forward.experts.15.w1,
525
+ model.layers.15.feed_forward.experts.15.w3, model.layers.15.feed_forward.experts.16.w1,
526
+ model.layers.15.feed_forward.experts.16.w3, model.layers.15.feed_forward.experts.17.w1,
527
+ model.layers.15.feed_forward.experts.17.w3, model.layers.15.feed_forward.experts.18.w1,
528
+ model.layers.15.feed_forward.experts.18.w3, model.layers.15.feed_forward.experts.19.w1,
529
+ model.layers.15.feed_forward.experts.19.w3, model.layers.15.feed_forward.experts.20.w1,
530
+ model.layers.15.feed_forward.experts.20.w3, model.layers.15.feed_forward.experts.21.w1,
531
+ model.layers.15.feed_forward.experts.21.w3, model.layers.15.feed_forward.experts.22.w1,
532
+ model.layers.15.feed_forward.experts.22.w3, model.layers.15.feed_forward.experts.23.w1,
533
+ model.layers.15.feed_forward.experts.23.w3, model.layers.15.feed_forward.experts.24.w1,
534
+ model.layers.15.feed_forward.experts.24.w3, model.layers.15.feed_forward.experts.25.w1,
535
+ model.layers.15.feed_forward.experts.25.w3, model.layers.15.feed_forward.experts.26.w1,
536
+ model.layers.15.feed_forward.experts.26.w3, model.layers.15.feed_forward.experts.27.w1,
537
+ model.layers.15.feed_forward.experts.27.w3, model.layers.15.feed_forward.experts.28.w1,
538
+ model.layers.15.feed_forward.experts.28.w3, model.layers.15.feed_forward.experts.29.w1,
539
+ model.layers.15.feed_forward.experts.29.w3, model.layers.15.feed_forward.experts.30.w1,
540
+ model.layers.15.feed_forward.experts.30.w3, model.layers.15.feed_forward.experts.31.w1,
541
+ model.layers.15.feed_forward.experts.31.w3]
542
+ - smooth_layer: model.layers.16.operator_norm
543
+ balance_layers: [model.layers.16.conv.in_proj]
544
+ - smooth_layer: model.layers.16.ffn_norm
545
+ balance_layers: [model.layers.16.feed_forward.gate, model.layers.16.feed_forward.experts.0.w1,
546
+ model.layers.16.feed_forward.experts.0.w3, model.layers.16.feed_forward.experts.1.w1,
547
+ model.layers.16.feed_forward.experts.1.w3, model.layers.16.feed_forward.experts.2.w1,
548
+ model.layers.16.feed_forward.experts.2.w3, model.layers.16.feed_forward.experts.3.w1,
549
+ model.layers.16.feed_forward.experts.3.w3, model.layers.16.feed_forward.experts.4.w1,
550
+ model.layers.16.feed_forward.experts.4.w3, model.layers.16.feed_forward.experts.5.w1,
551
+ model.layers.16.feed_forward.experts.5.w3, model.layers.16.feed_forward.experts.6.w1,
552
+ model.layers.16.feed_forward.experts.6.w3, model.layers.16.feed_forward.experts.7.w1,
553
+ model.layers.16.feed_forward.experts.7.w3, model.layers.16.feed_forward.experts.8.w1,
554
+ model.layers.16.feed_forward.experts.8.w3, model.layers.16.feed_forward.experts.9.w1,
555
+ model.layers.16.feed_forward.experts.9.w3, model.layers.16.feed_forward.experts.10.w1,
556
+ model.layers.16.feed_forward.experts.10.w3, model.layers.16.feed_forward.experts.11.w1,
557
+ model.layers.16.feed_forward.experts.11.w3, model.layers.16.feed_forward.experts.12.w1,
558
+ model.layers.16.feed_forward.experts.12.w3, model.layers.16.feed_forward.experts.13.w1,
559
+ model.layers.16.feed_forward.experts.13.w3, model.layers.16.feed_forward.experts.14.w1,
560
+ model.layers.16.feed_forward.experts.14.w3, model.layers.16.feed_forward.experts.15.w1,
561
+ model.layers.16.feed_forward.experts.15.w3, model.layers.16.feed_forward.experts.16.w1,
562
+ model.layers.16.feed_forward.experts.16.w3, model.layers.16.feed_forward.experts.17.w1,
563
+ model.layers.16.feed_forward.experts.17.w3, model.layers.16.feed_forward.experts.18.w1,
564
+ model.layers.16.feed_forward.experts.18.w3, model.layers.16.feed_forward.experts.19.w1,
565
+ model.layers.16.feed_forward.experts.19.w3, model.layers.16.feed_forward.experts.20.w1,
566
+ model.layers.16.feed_forward.experts.20.w3, model.layers.16.feed_forward.experts.21.w1,
567
+ model.layers.16.feed_forward.experts.21.w3, model.layers.16.feed_forward.experts.22.w1,
568
+ model.layers.16.feed_forward.experts.22.w3, model.layers.16.feed_forward.experts.23.w1,
569
+ model.layers.16.feed_forward.experts.23.w3, model.layers.16.feed_forward.experts.24.w1,
570
+ model.layers.16.feed_forward.experts.24.w3, model.layers.16.feed_forward.experts.25.w1,
571
+ model.layers.16.feed_forward.experts.25.w3, model.layers.16.feed_forward.experts.26.w1,
572
+ model.layers.16.feed_forward.experts.26.w3, model.layers.16.feed_forward.experts.27.w1,
573
+ model.layers.16.feed_forward.experts.27.w3, model.layers.16.feed_forward.experts.28.w1,
574
+ model.layers.16.feed_forward.experts.28.w3, model.layers.16.feed_forward.experts.29.w1,
575
+ model.layers.16.feed_forward.experts.29.w3, model.layers.16.feed_forward.experts.30.w1,
576
+ model.layers.16.feed_forward.experts.30.w3, model.layers.16.feed_forward.experts.31.w1,
577
+ model.layers.16.feed_forward.experts.31.w3]
578
+ - smooth_layer: model.layers.17.operator_norm
579
+ balance_layers: [model.layers.17.conv.in_proj]
580
+ - smooth_layer: model.layers.17.ffn_norm
581
+ balance_layers: [model.layers.17.feed_forward.gate, model.layers.17.feed_forward.experts.0.w1,
582
+ model.layers.17.feed_forward.experts.0.w3, model.layers.17.feed_forward.experts.1.w1,
583
+ model.layers.17.feed_forward.experts.1.w3, model.layers.17.feed_forward.experts.2.w1,
584
+ model.layers.17.feed_forward.experts.2.w3, model.layers.17.feed_forward.experts.3.w1,
585
+ model.layers.17.feed_forward.experts.3.w3, model.layers.17.feed_forward.experts.4.w1,
586
+ model.layers.17.feed_forward.experts.4.w3, model.layers.17.feed_forward.experts.5.w1,
587
+ model.layers.17.feed_forward.experts.5.w3, model.layers.17.feed_forward.experts.6.w1,
588
+ model.layers.17.feed_forward.experts.6.w3, model.layers.17.feed_forward.experts.7.w1,
589
+ model.layers.17.feed_forward.experts.7.w3, model.layers.17.feed_forward.experts.8.w1,
590
+ model.layers.17.feed_forward.experts.8.w3, model.layers.17.feed_forward.experts.9.w1,
591
+ model.layers.17.feed_forward.experts.9.w3, model.layers.17.feed_forward.experts.10.w1,
592
+ model.layers.17.feed_forward.experts.10.w3, model.layers.17.feed_forward.experts.11.w1,
593
+ model.layers.17.feed_forward.experts.11.w3, model.layers.17.feed_forward.experts.12.w1,
594
+ model.layers.17.feed_forward.experts.12.w3, model.layers.17.feed_forward.experts.13.w1,
595
+ model.layers.17.feed_forward.experts.13.w3, model.layers.17.feed_forward.experts.14.w1,
596
+ model.layers.17.feed_forward.experts.14.w3, model.layers.17.feed_forward.experts.15.w1,
597
+ model.layers.17.feed_forward.experts.15.w3, model.layers.17.feed_forward.experts.16.w1,
598
+ model.layers.17.feed_forward.experts.16.w3, model.layers.17.feed_forward.experts.17.w1,
599
+ model.layers.17.feed_forward.experts.17.w3, model.layers.17.feed_forward.experts.18.w1,
600
+ model.layers.17.feed_forward.experts.18.w3, model.layers.17.feed_forward.experts.19.w1,
601
+ model.layers.17.feed_forward.experts.19.w3, model.layers.17.feed_forward.experts.20.w1,
602
+ model.layers.17.feed_forward.experts.20.w3, model.layers.17.feed_forward.experts.21.w1,
603
+ model.layers.17.feed_forward.experts.21.w3, model.layers.17.feed_forward.experts.22.w1,
604
+ model.layers.17.feed_forward.experts.22.w3, model.layers.17.feed_forward.experts.23.w1,
605
+ model.layers.17.feed_forward.experts.23.w3, model.layers.17.feed_forward.experts.24.w1,
606
+ model.layers.17.feed_forward.experts.24.w3, model.layers.17.feed_forward.experts.25.w1,
607
+ model.layers.17.feed_forward.experts.25.w3, model.layers.17.feed_forward.experts.26.w1,
608
+ model.layers.17.feed_forward.experts.26.w3, model.layers.17.feed_forward.experts.27.w1,
609
+ model.layers.17.feed_forward.experts.27.w3, model.layers.17.feed_forward.experts.28.w1,
610
+ model.layers.17.feed_forward.experts.28.w3, model.layers.17.feed_forward.experts.29.w1,
611
+ model.layers.17.feed_forward.experts.29.w3, model.layers.17.feed_forward.experts.30.w1,
612
+ model.layers.17.feed_forward.experts.30.w3, model.layers.17.feed_forward.experts.31.w1,
613
+ model.layers.17.feed_forward.experts.31.w3]
614
+ - smooth_layer: model.layers.18.operator_norm
615
+ balance_layers: [model.layers.18.self_attn.q_proj, model.layers.18.self_attn.k_proj,
616
+ model.layers.18.self_attn.v_proj]
617
+ - smooth_layer: model.layers.18.ffn_norm
618
+ balance_layers: [model.layers.18.feed_forward.gate, model.layers.18.feed_forward.experts.0.w1,
619
+ model.layers.18.feed_forward.experts.0.w3, model.layers.18.feed_forward.experts.1.w1,
620
+ model.layers.18.feed_forward.experts.1.w3, model.layers.18.feed_forward.experts.2.w1,
621
+ model.layers.18.feed_forward.experts.2.w3, model.layers.18.feed_forward.experts.3.w1,
622
+ model.layers.18.feed_forward.experts.3.w3, model.layers.18.feed_forward.experts.4.w1,
623
+ model.layers.18.feed_forward.experts.4.w3, model.layers.18.feed_forward.experts.5.w1,
624
+ model.layers.18.feed_forward.experts.5.w3, model.layers.18.feed_forward.experts.6.w1,
625
+ model.layers.18.feed_forward.experts.6.w3, model.layers.18.feed_forward.experts.7.w1,
626
+ model.layers.18.feed_forward.experts.7.w3, model.layers.18.feed_forward.experts.8.w1,
627
+ model.layers.18.feed_forward.experts.8.w3, model.layers.18.feed_forward.experts.9.w1,
628
+ model.layers.18.feed_forward.experts.9.w3, model.layers.18.feed_forward.experts.10.w1,
629
+ model.layers.18.feed_forward.experts.10.w3, model.layers.18.feed_forward.experts.11.w1,
630
+ model.layers.18.feed_forward.experts.11.w3, model.layers.18.feed_forward.experts.12.w1,
631
+ model.layers.18.feed_forward.experts.12.w3, model.layers.18.feed_forward.experts.13.w1,
632
+ model.layers.18.feed_forward.experts.13.w3, model.layers.18.feed_forward.experts.14.w1,
633
+ model.layers.18.feed_forward.experts.14.w3, model.layers.18.feed_forward.experts.15.w1,
634
+ model.layers.18.feed_forward.experts.15.w3, model.layers.18.feed_forward.experts.16.w1,
635
+ model.layers.18.feed_forward.experts.16.w3, model.layers.18.feed_forward.experts.17.w1,
636
+ model.layers.18.feed_forward.experts.17.w3, model.layers.18.feed_forward.experts.18.w1,
637
+ model.layers.18.feed_forward.experts.18.w3, model.layers.18.feed_forward.experts.19.w1,
638
+ model.layers.18.feed_forward.experts.19.w3, model.layers.18.feed_forward.experts.20.w1,
639
+ model.layers.18.feed_forward.experts.20.w3, model.layers.18.feed_forward.experts.21.w1,
640
+ model.layers.18.feed_forward.experts.21.w3, model.layers.18.feed_forward.experts.22.w1,
641
+ model.layers.18.feed_forward.experts.22.w3, model.layers.18.feed_forward.experts.23.w1,
642
+ model.layers.18.feed_forward.experts.23.w3, model.layers.18.feed_forward.experts.24.w1,
643
+ model.layers.18.feed_forward.experts.24.w3, model.layers.18.feed_forward.experts.25.w1,
644
+ model.layers.18.feed_forward.experts.25.w3, model.layers.18.feed_forward.experts.26.w1,
645
+ model.layers.18.feed_forward.experts.26.w3, model.layers.18.feed_forward.experts.27.w1,
646
+ model.layers.18.feed_forward.experts.27.w3, model.layers.18.feed_forward.experts.28.w1,
647
+ model.layers.18.feed_forward.experts.28.w3, model.layers.18.feed_forward.experts.29.w1,
648
+ model.layers.18.feed_forward.experts.29.w3, model.layers.18.feed_forward.experts.30.w1,
649
+ model.layers.18.feed_forward.experts.30.w3, model.layers.18.feed_forward.experts.31.w1,
650
+ model.layers.18.feed_forward.experts.31.w3]
651
+ - smooth_layer: model.layers.19.operator_norm
652
+ balance_layers: [model.layers.19.conv.in_proj]
653
+ - smooth_layer: model.layers.19.ffn_norm
654
+ balance_layers: [model.layers.19.feed_forward.gate, model.layers.19.feed_forward.experts.0.w1,
655
+ model.layers.19.feed_forward.experts.0.w3, model.layers.19.feed_forward.experts.1.w1,
656
+ model.layers.19.feed_forward.experts.1.w3, model.layers.19.feed_forward.experts.2.w1,
657
+ model.layers.19.feed_forward.experts.2.w3, model.layers.19.feed_forward.experts.3.w1,
658
+ model.layers.19.feed_forward.experts.3.w3, model.layers.19.feed_forward.experts.4.w1,
659
+ model.layers.19.feed_forward.experts.4.w3, model.layers.19.feed_forward.experts.5.w1,
660
+ model.layers.19.feed_forward.experts.5.w3, model.layers.19.feed_forward.experts.6.w1,
661
+ model.layers.19.feed_forward.experts.6.w3, model.layers.19.feed_forward.experts.7.w1,
662
+ model.layers.19.feed_forward.experts.7.w3, model.layers.19.feed_forward.experts.8.w1,
663
+ model.layers.19.feed_forward.experts.8.w3, model.layers.19.feed_forward.experts.9.w1,
664
+ model.layers.19.feed_forward.experts.9.w3, model.layers.19.feed_forward.experts.10.w1,
665
+ model.layers.19.feed_forward.experts.10.w3, model.layers.19.feed_forward.experts.11.w1,
666
+ model.layers.19.feed_forward.experts.11.w3, model.layers.19.feed_forward.experts.12.w1,
667
+ model.layers.19.feed_forward.experts.12.w3, model.layers.19.feed_forward.experts.13.w1,
668
+ model.layers.19.feed_forward.experts.13.w3, model.layers.19.feed_forward.experts.14.w1,
669
+ model.layers.19.feed_forward.experts.14.w3, model.layers.19.feed_forward.experts.15.w1,
670
+ model.layers.19.feed_forward.experts.15.w3, model.layers.19.feed_forward.experts.16.w1,
671
+ model.layers.19.feed_forward.experts.16.w3, model.layers.19.feed_forward.experts.17.w1,
672
+ model.layers.19.feed_forward.experts.17.w3, model.layers.19.feed_forward.experts.18.w1,
673
+ model.layers.19.feed_forward.experts.18.w3, model.layers.19.feed_forward.experts.19.w1,
674
+ model.layers.19.feed_forward.experts.19.w3, model.layers.19.feed_forward.experts.20.w1,
675
+ model.layers.19.feed_forward.experts.20.w3, model.layers.19.feed_forward.experts.21.w1,
676
+ model.layers.19.feed_forward.experts.21.w3, model.layers.19.feed_forward.experts.22.w1,
677
+ model.layers.19.feed_forward.experts.22.w3, model.layers.19.feed_forward.experts.23.w1,
678
+ model.layers.19.feed_forward.experts.23.w3, model.layers.19.feed_forward.experts.24.w1,
679
+ model.layers.19.feed_forward.experts.24.w3, model.layers.19.feed_forward.experts.25.w1,
680
+ model.layers.19.feed_forward.experts.25.w3, model.layers.19.feed_forward.experts.26.w1,
681
+ model.layers.19.feed_forward.experts.26.w3, model.layers.19.feed_forward.experts.27.w1,
682
+ model.layers.19.feed_forward.experts.27.w3, model.layers.19.feed_forward.experts.28.w1,
683
+ model.layers.19.feed_forward.experts.28.w3, model.layers.19.feed_forward.experts.29.w1,
684
+ model.layers.19.feed_forward.experts.29.w3, model.layers.19.feed_forward.experts.30.w1,
685
+ model.layers.19.feed_forward.experts.30.w3, model.layers.19.feed_forward.experts.31.w1,
686
+ model.layers.19.feed_forward.experts.31.w3]
687
+ - smooth_layer: model.layers.20.operator_norm
688
+ balance_layers: [model.layers.20.conv.in_proj]
689
+ - smooth_layer: model.layers.20.ffn_norm
690
+ balance_layers: [model.layers.20.feed_forward.gate, model.layers.20.feed_forward.experts.0.w1,
691
+ model.layers.20.feed_forward.experts.0.w3, model.layers.20.feed_forward.experts.1.w1,
692
+ model.layers.20.feed_forward.experts.1.w3, model.layers.20.feed_forward.experts.2.w1,
693
+ model.layers.20.feed_forward.experts.2.w3, model.layers.20.feed_forward.experts.3.w1,
694
+ model.layers.20.feed_forward.experts.3.w3, model.layers.20.feed_forward.experts.4.w1,
695
+ model.layers.20.feed_forward.experts.4.w3, model.layers.20.feed_forward.experts.5.w1,
696
+ model.layers.20.feed_forward.experts.5.w3, model.layers.20.feed_forward.experts.6.w1,
697
+ model.layers.20.feed_forward.experts.6.w3, model.layers.20.feed_forward.experts.7.w1,
698
+ model.layers.20.feed_forward.experts.7.w3, model.layers.20.feed_forward.experts.8.w1,
699
+ model.layers.20.feed_forward.experts.8.w3, model.layers.20.feed_forward.experts.9.w1,
700
+ model.layers.20.feed_forward.experts.9.w3, model.layers.20.feed_forward.experts.10.w1,
701
+ model.layers.20.feed_forward.experts.10.w3, model.layers.20.feed_forward.experts.11.w1,
702
+ model.layers.20.feed_forward.experts.11.w3, model.layers.20.feed_forward.experts.12.w1,
703
+ model.layers.20.feed_forward.experts.12.w3, model.layers.20.feed_forward.experts.13.w1,
704
+ model.layers.20.feed_forward.experts.13.w3, model.layers.20.feed_forward.experts.14.w1,
705
+ model.layers.20.feed_forward.experts.14.w3, model.layers.20.feed_forward.experts.15.w1,
706
+ model.layers.20.feed_forward.experts.15.w3, model.layers.20.feed_forward.experts.16.w1,
707
+ model.layers.20.feed_forward.experts.16.w3, model.layers.20.feed_forward.experts.17.w1,
708
+ model.layers.20.feed_forward.experts.17.w3, model.layers.20.feed_forward.experts.18.w1,
709
+ model.layers.20.feed_forward.experts.18.w3, model.layers.20.feed_forward.experts.19.w1,
710
+ model.layers.20.feed_forward.experts.19.w3, model.layers.20.feed_forward.experts.20.w1,
711
+ model.layers.20.feed_forward.experts.20.w3, model.layers.20.feed_forward.experts.21.w1,
712
+ model.layers.20.feed_forward.experts.21.w3, model.layers.20.feed_forward.experts.22.w1,
713
+ model.layers.20.feed_forward.experts.22.w3, model.layers.20.feed_forward.experts.23.w1,
714
+ model.layers.20.feed_forward.experts.23.w3, model.layers.20.feed_forward.experts.24.w1,
715
+ model.layers.20.feed_forward.experts.24.w3, model.layers.20.feed_forward.experts.25.w1,
716
+ model.layers.20.feed_forward.experts.25.w3, model.layers.20.feed_forward.experts.26.w1,
717
+ model.layers.20.feed_forward.experts.26.w3, model.layers.20.feed_forward.experts.27.w1,
718
+ model.layers.20.feed_forward.experts.27.w3, model.layers.20.feed_forward.experts.28.w1,
719
+ model.layers.20.feed_forward.experts.28.w3, model.layers.20.feed_forward.experts.29.w1,
720
+ model.layers.20.feed_forward.experts.29.w3, model.layers.20.feed_forward.experts.30.w1,
721
+ model.layers.20.feed_forward.experts.30.w3, model.layers.20.feed_forward.experts.31.w1,
722
+ model.layers.20.feed_forward.experts.31.w3]
723
+ - smooth_layer: model.layers.21.operator_norm
724
+ balance_layers: [model.layers.21.self_attn.q_proj, model.layers.21.self_attn.k_proj,
725
+ model.layers.21.self_attn.v_proj]
726
+ - smooth_layer: model.layers.21.ffn_norm
727
+ balance_layers: [model.layers.21.feed_forward.gate, model.layers.21.feed_forward.experts.0.w1,
728
+ model.layers.21.feed_forward.experts.0.w3, model.layers.21.feed_forward.experts.1.w1,
729
+ model.layers.21.feed_forward.experts.1.w3, model.layers.21.feed_forward.experts.2.w1,
730
+ model.layers.21.feed_forward.experts.2.w3, model.layers.21.feed_forward.experts.3.w1,
731
+ model.layers.21.feed_forward.experts.3.w3, model.layers.21.feed_forward.experts.4.w1,
732
+ model.layers.21.feed_forward.experts.4.w3, model.layers.21.feed_forward.experts.5.w1,
733
+ model.layers.21.feed_forward.experts.5.w3, model.layers.21.feed_forward.experts.6.w1,
734
+ model.layers.21.feed_forward.experts.6.w3, model.layers.21.feed_forward.experts.7.w1,
735
+ model.layers.21.feed_forward.experts.7.w3, model.layers.21.feed_forward.experts.8.w1,
736
+ model.layers.21.feed_forward.experts.8.w3, model.layers.21.feed_forward.experts.9.w1,
737
+ model.layers.21.feed_forward.experts.9.w3, model.layers.21.feed_forward.experts.10.w1,
738
+ model.layers.21.feed_forward.experts.10.w3, model.layers.21.feed_forward.experts.11.w1,
739
+ model.layers.21.feed_forward.experts.11.w3, model.layers.21.feed_forward.experts.12.w1,
740
+ model.layers.21.feed_forward.experts.12.w3, model.layers.21.feed_forward.experts.13.w1,
741
+ model.layers.21.feed_forward.experts.13.w3, model.layers.21.feed_forward.experts.14.w1,
742
+ model.layers.21.feed_forward.experts.14.w3, model.layers.21.feed_forward.experts.15.w1,
743
+ model.layers.21.feed_forward.experts.15.w3, model.layers.21.feed_forward.experts.16.w1,
744
+ model.layers.21.feed_forward.experts.16.w3, model.layers.21.feed_forward.experts.17.w1,
745
+ model.layers.21.feed_forward.experts.17.w3, model.layers.21.feed_forward.experts.18.w1,
746
+ model.layers.21.feed_forward.experts.18.w3, model.layers.21.feed_forward.experts.19.w1,
747
+ model.layers.21.feed_forward.experts.19.w3, model.layers.21.feed_forward.experts.20.w1,
748
+ model.layers.21.feed_forward.experts.20.w3, model.layers.21.feed_forward.experts.21.w1,
749
+ model.layers.21.feed_forward.experts.21.w3, model.layers.21.feed_forward.experts.22.w1,
750
+ model.layers.21.feed_forward.experts.22.w3, model.layers.21.feed_forward.experts.23.w1,
751
+ model.layers.21.feed_forward.experts.23.w3, model.layers.21.feed_forward.experts.24.w1,
752
+ model.layers.21.feed_forward.experts.24.w3, model.layers.21.feed_forward.experts.25.w1,
753
+ model.layers.21.feed_forward.experts.25.w3, model.layers.21.feed_forward.experts.26.w1,
754
+ model.layers.21.feed_forward.experts.26.w3, model.layers.21.feed_forward.experts.27.w1,
755
+ model.layers.21.feed_forward.experts.27.w3, model.layers.21.feed_forward.experts.28.w1,
756
+ model.layers.21.feed_forward.experts.28.w3, model.layers.21.feed_forward.experts.29.w1,
757
+ model.layers.21.feed_forward.experts.29.w3, model.layers.21.feed_forward.experts.30.w1,
758
+ model.layers.21.feed_forward.experts.30.w3, model.layers.21.feed_forward.experts.31.w1,
759
+ model.layers.21.feed_forward.experts.31.w3]
760
+ - smooth_layer: model.layers.22.operator_norm
761
+ balance_layers: [model.layers.22.conv.in_proj]
762
+ - smooth_layer: model.layers.22.ffn_norm
763
+ balance_layers: [model.layers.22.feed_forward.gate, model.layers.22.feed_forward.experts.0.w1,
764
+ model.layers.22.feed_forward.experts.0.w3, model.layers.22.feed_forward.experts.1.w1,
765
+ model.layers.22.feed_forward.experts.1.w3, model.layers.22.feed_forward.experts.2.w1,
766
+ model.layers.22.feed_forward.experts.2.w3, model.layers.22.feed_forward.experts.3.w1,
767
+ model.layers.22.feed_forward.experts.3.w3, model.layers.22.feed_forward.experts.4.w1,
768
+ model.layers.22.feed_forward.experts.4.w3, model.layers.22.feed_forward.experts.5.w1,
769
+ model.layers.22.feed_forward.experts.5.w3, model.layers.22.feed_forward.experts.6.w1,
770
+ model.layers.22.feed_forward.experts.6.w3, model.layers.22.feed_forward.experts.7.w1,
771
+ model.layers.22.feed_forward.experts.7.w3, model.layers.22.feed_forward.experts.8.w1,
772
+ model.layers.22.feed_forward.experts.8.w3, model.layers.22.feed_forward.experts.9.w1,
773
+ model.layers.22.feed_forward.experts.9.w3, model.layers.22.feed_forward.experts.10.w1,
774
+ model.layers.22.feed_forward.experts.10.w3, model.layers.22.feed_forward.experts.11.w1,
775
+ model.layers.22.feed_forward.experts.11.w3, model.layers.22.feed_forward.experts.12.w1,
776
+ model.layers.22.feed_forward.experts.12.w3, model.layers.22.feed_forward.experts.13.w1,
777
+ model.layers.22.feed_forward.experts.13.w3, model.layers.22.feed_forward.experts.14.w1,
778
+ model.layers.22.feed_forward.experts.14.w3, model.layers.22.feed_forward.experts.15.w1,
779
+ model.layers.22.feed_forward.experts.15.w3, model.layers.22.feed_forward.experts.16.w1,
780
+ model.layers.22.feed_forward.experts.16.w3, model.layers.22.feed_forward.experts.17.w1,
781
+ model.layers.22.feed_forward.experts.17.w3, model.layers.22.feed_forward.experts.18.w1,
782
+ model.layers.22.feed_forward.experts.18.w3, model.layers.22.feed_forward.experts.19.w1,
783
+ model.layers.22.feed_forward.experts.19.w3, model.layers.22.feed_forward.experts.20.w1,
784
+ model.layers.22.feed_forward.experts.20.w3, model.layers.22.feed_forward.experts.21.w1,
785
+ model.layers.22.feed_forward.experts.21.w3, model.layers.22.feed_forward.experts.22.w1,
786
+ model.layers.22.feed_forward.experts.22.w3, model.layers.22.feed_forward.experts.23.w1,
787
+ model.layers.22.feed_forward.experts.23.w3, model.layers.22.feed_forward.experts.24.w1,
788
+ model.layers.22.feed_forward.experts.24.w3, model.layers.22.feed_forward.experts.25.w1,
789
+ model.layers.22.feed_forward.experts.25.w3, model.layers.22.feed_forward.experts.26.w1,
790
+ model.layers.22.feed_forward.experts.26.w3, model.layers.22.feed_forward.experts.27.w1,
791
+ model.layers.22.feed_forward.experts.27.w3, model.layers.22.feed_forward.experts.28.w1,
792
+ model.layers.22.feed_forward.experts.28.w3, model.layers.22.feed_forward.experts.29.w1,
793
+ model.layers.22.feed_forward.experts.29.w3, model.layers.22.feed_forward.experts.30.w1,
794
+ model.layers.22.feed_forward.experts.30.w3, model.layers.22.feed_forward.experts.31.w1,
795
+ model.layers.22.feed_forward.experts.31.w3]
796
+ - smooth_layer: model.layers.23.operator_norm
797
+ balance_layers: [model.layers.23.conv.in_proj]
798
+ - smooth_layer: model.layers.23.ffn_norm
799
+ balance_layers: [model.layers.23.feed_forward.gate, model.layers.23.feed_forward.experts.0.w1,
800
+ model.layers.23.feed_forward.experts.0.w3, model.layers.23.feed_forward.experts.1.w1,
801
+ model.layers.23.feed_forward.experts.1.w3, model.layers.23.feed_forward.experts.2.w1,
802
+ model.layers.23.feed_forward.experts.2.w3, model.layers.23.feed_forward.experts.3.w1,
803
+ model.layers.23.feed_forward.experts.3.w3, model.layers.23.feed_forward.experts.4.w1,
804
+ model.layers.23.feed_forward.experts.4.w3, model.layers.23.feed_forward.experts.5.w1,
805
+ model.layers.23.feed_forward.experts.5.w3, model.layers.23.feed_forward.experts.6.w1,
806
+ model.layers.23.feed_forward.experts.6.w3, model.layers.23.feed_forward.experts.7.w1,
807
+ model.layers.23.feed_forward.experts.7.w3, model.layers.23.feed_forward.experts.8.w1,
808
+ model.layers.23.feed_forward.experts.8.w3, model.layers.23.feed_forward.experts.9.w1,
809
+ model.layers.23.feed_forward.experts.9.w3, model.layers.23.feed_forward.experts.10.w1,
810
+ model.layers.23.feed_forward.experts.10.w3, model.layers.23.feed_forward.experts.11.w1,
811
+ model.layers.23.feed_forward.experts.11.w3, model.layers.23.feed_forward.experts.12.w1,
812
+ model.layers.23.feed_forward.experts.12.w3, model.layers.23.feed_forward.experts.13.w1,
813
+ model.layers.23.feed_forward.experts.13.w3, model.layers.23.feed_forward.experts.14.w1,
814
+ model.layers.23.feed_forward.experts.14.w3, model.layers.23.feed_forward.experts.15.w1,
815
+ model.layers.23.feed_forward.experts.15.w3, model.layers.23.feed_forward.experts.16.w1,
816
+ model.layers.23.feed_forward.experts.16.w3, model.layers.23.feed_forward.experts.17.w1,
817
+ model.layers.23.feed_forward.experts.17.w3, model.layers.23.feed_forward.experts.18.w1,
818
+ model.layers.23.feed_forward.experts.18.w3, model.layers.23.feed_forward.experts.19.w1,
819
+ model.layers.23.feed_forward.experts.19.w3, model.layers.23.feed_forward.experts.20.w1,
820
+ model.layers.23.feed_forward.experts.20.w3, model.layers.23.feed_forward.experts.21.w1,
821
+ model.layers.23.feed_forward.experts.21.w3, model.layers.23.feed_forward.experts.22.w1,
822
+ model.layers.23.feed_forward.experts.22.w3, model.layers.23.feed_forward.experts.23.w1,
823
+ model.layers.23.feed_forward.experts.23.w3, model.layers.23.feed_forward.experts.24.w1,
824
+ model.layers.23.feed_forward.experts.24.w3, model.layers.23.feed_forward.experts.25.w1,
825
+ model.layers.23.feed_forward.experts.25.w3, model.layers.23.feed_forward.experts.26.w1,
826
+ model.layers.23.feed_forward.experts.26.w3, model.layers.23.feed_forward.experts.27.w1,
827
+ model.layers.23.feed_forward.experts.27.w3, model.layers.23.feed_forward.experts.28.w1,
828
+ model.layers.23.feed_forward.experts.28.w3, model.layers.23.feed_forward.experts.29.w1,
829
+ model.layers.23.feed_forward.experts.29.w3, model.layers.23.feed_forward.experts.30.w1,
830
+ model.layers.23.feed_forward.experts.30.w3, model.layers.23.feed_forward.experts.31.w1,
831
+ model.layers.23.feed_forward.experts.31.w3]
832
+ - smooth_layer: model.embedding_norm
833
+ balance_layers: [lm_head]
834
+ duo_scaling: true
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|im_end|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|pad|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,4078 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "added_tokens_decoder": {
5
+ "0": {
6
+ "content": "<|pad|>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "1": {
14
+ "content": "<|startoftext|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "2": {
22
+ "content": "<|endoftext|>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ },
29
+ "3": {
30
+ "content": "<|fim_pre|>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ },
37
+ "4": {
38
+ "content": "<|fim_mid|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false,
43
+ "special": true
44
+ },
45
+ "5": {
46
+ "content": "<|fim_suf|>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false,
51
+ "special": true
52
+ },
53
+ "6": {
54
+ "content": "<|im_start|>",
55
+ "lstrip": false,
56
+ "normalized": false,
57
+ "rstrip": false,
58
+ "single_word": false,
59
+ "special": true
60
+ },
61
+ "7": {
62
+ "content": "<|im_end|>",
63
+ "lstrip": false,
64
+ "normalized": false,
65
+ "rstrip": false,
66
+ "single_word": false,
67
+ "special": true
68
+ },
69
+ "8": {
70
+ "content": "<|tool_list_start|>",
71
+ "lstrip": false,
72
+ "normalized": false,
73
+ "rstrip": false,
74
+ "single_word": false,
75
+ "special": true
76
+ },
77
+ "9": {
78
+ "content": "<|tool_list_end|>",
79
+ "lstrip": false,
80
+ "normalized": false,
81
+ "rstrip": false,
82
+ "single_word": false,
83
+ "special": true
84
+ },
85
+ "10": {
86
+ "content": "<|tool_call_start|>",
87
+ "lstrip": false,
88
+ "normalized": false,
89
+ "rstrip": false,
90
+ "single_word": false,
91
+ "special": false
92
+ },
93
+ "11": {
94
+ "content": "<|tool_call_end|>",
95
+ "lstrip": false,
96
+ "normalized": false,
97
+ "rstrip": false,
98
+ "single_word": false,
99
+ "special": false
100
+ },
101
+ "12": {
102
+ "content": "<|tool_response_start|>",
103
+ "lstrip": false,
104
+ "normalized": false,
105
+ "rstrip": false,
106
+ "single_word": false,
107
+ "special": true
108
+ },
109
+ "13": {
110
+ "content": "<|tool_response_end|>",
111
+ "lstrip": false,
112
+ "normalized": false,
113
+ "rstrip": false,
114
+ "single_word": false,
115
+ "special": true
116
+ },
117
+ "16": {
118
+ "content": "<|reserved_6|>",
119
+ "lstrip": false,
120
+ "normalized": false,
121
+ "rstrip": false,
122
+ "single_word": false,
123
+ "special": true
124
+ },
125
+ "17": {
126
+ "content": "<|reserved_7|>",
127
+ "lstrip": false,
128
+ "normalized": false,
129
+ "rstrip": false,
130
+ "single_word": false,
131
+ "special": true
132
+ },
133
+ "18": {
134
+ "content": "<|reserved_8|>",
135
+ "lstrip": false,
136
+ "normalized": false,
137
+ "rstrip": false,
138
+ "single_word": false,
139
+ "special": true
140
+ },
141
+ "19": {
142
+ "content": "<|reserved_9|>",
143
+ "lstrip": false,
144
+ "normalized": false,
145
+ "rstrip": false,
146
+ "single_word": false,
147
+ "special": true
148
+ },
149
+ "20": {
150
+ "content": "<|reserved_10|>",
151
+ "lstrip": false,
152
+ "normalized": false,
153
+ "rstrip": false,
154
+ "single_word": false,
155
+ "special": true
156
+ },
157
+ "21": {
158
+ "content": "<|reserved_11|>",
159
+ "lstrip": false,
160
+ "normalized": false,
161
+ "rstrip": false,
162
+ "single_word": false,
163
+ "special": true
164
+ },
165
+ "22": {
166
+ "content": "<|reserved_12|>",
167
+ "lstrip": false,
168
+ "normalized": false,
169
+ "rstrip": false,
170
+ "single_word": false,
171
+ "special": true
172
+ },
173
+ "23": {
174
+ "content": "<|reserved_13|>",
175
+ "lstrip": false,
176
+ "normalized": false,
177
+ "rstrip": false,
178
+ "single_word": false,
179
+ "special": true
180
+ },
181
+ "24": {
182
+ "content": "<|reserved_14|>",
183
+ "lstrip": false,
184
+ "normalized": false,
185
+ "rstrip": false,
186
+ "single_word": false,
187
+ "special": true
188
+ },
189
+ "25": {
190
+ "content": "<|reserved_15|>",
191
+ "lstrip": false,
192
+ "normalized": false,
193
+ "rstrip": false,
194
+ "single_word": false,
195
+ "special": true
196
+ },
197
+ "26": {
198
+ "content": "<|reserved_16|>",
199
+ "lstrip": false,
200
+ "normalized": false,
201
+ "rstrip": false,
202
+ "single_word": false,
203
+ "special": true
204
+ },
205
+ "27": {
206
+ "content": "<|reserved_17|>",
207
+ "lstrip": false,
208
+ "normalized": false,
209
+ "rstrip": false,
210
+ "single_word": false,
211
+ "special": true
212
+ },
213
+ "28": {
214
+ "content": "<|reserved_18|>",
215
+ "lstrip": false,
216
+ "normalized": false,
217
+ "rstrip": false,
218
+ "single_word": false,
219
+ "special": true
220
+ },
221
+ "29": {
222
+ "content": "<|reserved_19|>",
223
+ "lstrip": false,
224
+ "normalized": false,
225
+ "rstrip": false,
226
+ "single_word": false,
227
+ "special": true
228
+ },
229
+ "30": {
230
+ "content": "<|reserved_20|>",
231
+ "lstrip": false,
232
+ "normalized": false,
233
+ "rstrip": false,
234
+ "single_word": false,
235
+ "special": true
236
+ },
237
+ "31": {
238
+ "content": "<|reserved_21|>",
239
+ "lstrip": false,
240
+ "normalized": false,
241
+ "rstrip": false,
242
+ "single_word": false,
243
+ "special": true
244
+ },
245
+ "32": {
246
+ "content": "<|reserved_22|>",
247
+ "lstrip": false,
248
+ "normalized": false,
249
+ "rstrip": false,
250
+ "single_word": false,
251
+ "special": true
252
+ },
253
+ "33": {
254
+ "content": "<|reserved_23|>",
255
+ "lstrip": false,
256
+ "normalized": false,
257
+ "rstrip": false,
258
+ "single_word": false,
259
+ "special": true
260
+ },
261
+ "34": {
262
+ "content": "<|reserved_24|>",
263
+ "lstrip": false,
264
+ "normalized": false,
265
+ "rstrip": false,
266
+ "single_word": false,
267
+ "special": true
268
+ },
269
+ "35": {
270
+ "content": "<|reserved_25|>",
271
+ "lstrip": false,
272
+ "normalized": false,
273
+ "rstrip": false,
274
+ "single_word": false,
275
+ "special": true
276
+ },
277
+ "36": {
278
+ "content": "<|reserved_26|>",
279
+ "lstrip": false,
280
+ "normalized": false,
281
+ "rstrip": false,
282
+ "single_word": false,
283
+ "special": true
284
+ },
285
+ "37": {
286
+ "content": "<|reserved_27|>",
287
+ "lstrip": false,
288
+ "normalized": false,
289
+ "rstrip": false,
290
+ "single_word": false,
291
+ "special": true
292
+ },
293
+ "38": {
294
+ "content": "<|reserved_28|>",
295
+ "lstrip": false,
296
+ "normalized": false,
297
+ "rstrip": false,
298
+ "single_word": false,
299
+ "special": true
300
+ },
301
+ "39": {
302
+ "content": "<|reserved_29|>",
303
+ "lstrip": false,
304
+ "normalized": false,
305
+ "rstrip": false,
306
+ "single_word": false,
307
+ "special": true
308
+ },
309
+ "40": {
310
+ "content": "<|reserved_30|>",
311
+ "lstrip": false,
312
+ "normalized": false,
313
+ "rstrip": false,
314
+ "single_word": false,
315
+ "special": true
316
+ },
317
+ "41": {
318
+ "content": "<|reserved_31|>",
319
+ "lstrip": false,
320
+ "normalized": false,
321
+ "rstrip": false,
322
+ "single_word": false,
323
+ "special": true
324
+ },
325
+ "42": {
326
+ "content": "<|reserved_32|>",
327
+ "lstrip": false,
328
+ "normalized": false,
329
+ "rstrip": false,
330
+ "single_word": false,
331
+ "special": true
332
+ },
333
+ "43": {
334
+ "content": "<|reserved_33|>",
335
+ "lstrip": false,
336
+ "normalized": false,
337
+ "rstrip": false,
338
+ "single_word": false,
339
+ "special": true
340
+ },
341
+ "44": {
342
+ "content": "<|reserved_34|>",
343
+ "lstrip": false,
344
+ "normalized": false,
345
+ "rstrip": false,
346
+ "single_word": false,
347
+ "special": true
348
+ },
349
+ "45": {
350
+ "content": "<|reserved_35|>",
351
+ "lstrip": false,
352
+ "normalized": false,
353
+ "rstrip": false,
354
+ "single_word": false,
355
+ "special": true
356
+ },
357
+ "46": {
358
+ "content": "<|reserved_36|>",
359
+ "lstrip": false,
360
+ "normalized": false,
361
+ "rstrip": false,
362
+ "single_word": false,
363
+ "special": true
364
+ },
365
+ "47": {
366
+ "content": "<|reserved_37|>",
367
+ "lstrip": false,
368
+ "normalized": false,
369
+ "rstrip": false,
370
+ "single_word": false,
371
+ "special": true
372
+ },
373
+ "48": {
374
+ "content": "<|reserved_38|>",
375
+ "lstrip": false,
376
+ "normalized": false,
377
+ "rstrip": false,
378
+ "single_word": false,
379
+ "special": true
380
+ },
381
+ "49": {
382
+ "content": "<|reserved_39|>",
383
+ "lstrip": false,
384
+ "normalized": false,
385
+ "rstrip": false,
386
+ "single_word": false,
387
+ "special": true
388
+ },
389
+ "50": {
390
+ "content": "<|reserved_40|>",
391
+ "lstrip": false,
392
+ "normalized": false,
393
+ "rstrip": false,
394
+ "single_word": false,
395
+ "special": true
396
+ },
397
+ "51": {
398
+ "content": "<|reserved_41|>",
399
+ "lstrip": false,
400
+ "normalized": false,
401
+ "rstrip": false,
402
+ "single_word": false,
403
+ "special": true
404
+ },
405
+ "52": {
406
+ "content": "<|reserved_42|>",
407
+ "lstrip": false,
408
+ "normalized": false,
409
+ "rstrip": false,
410
+ "single_word": false,
411
+ "special": true
412
+ },
413
+ "53": {
414
+ "content": "<|reserved_43|>",
415
+ "lstrip": false,
416
+ "normalized": false,
417
+ "rstrip": false,
418
+ "single_word": false,
419
+ "special": true
420
+ },
421
+ "54": {
422
+ "content": "<|reserved_44|>",
423
+ "lstrip": false,
424
+ "normalized": false,
425
+ "rstrip": false,
426
+ "single_word": false,
427
+ "special": true
428
+ },
429
+ "55": {
430
+ "content": "<|reserved_45|>",
431
+ "lstrip": false,
432
+ "normalized": false,
433
+ "rstrip": false,
434
+ "single_word": false,
435
+ "special": true
436
+ },
437
+ "56": {
438
+ "content": "<|reserved_46|>",
439
+ "lstrip": false,
440
+ "normalized": false,
441
+ "rstrip": false,
442
+ "single_word": false,
443
+ "special": true
444
+ },
445
+ "57": {
446
+ "content": "<|reserved_47|>",
447
+ "lstrip": false,
448
+ "normalized": false,
449
+ "rstrip": false,
450
+ "single_word": false,
451
+ "special": true
452
+ },
453
+ "58": {
454
+ "content": "<|reserved_48|>",
455
+ "lstrip": false,
456
+ "normalized": false,
457
+ "rstrip": false,
458
+ "single_word": false,
459
+ "special": true
460
+ },
461
+ "59": {
462
+ "content": "<|reserved_49|>",
463
+ "lstrip": false,
464
+ "normalized": false,
465
+ "rstrip": false,
466
+ "single_word": false,
467
+ "special": true
468
+ },
469
+ "60": {
470
+ "content": "<|reserved_50|>",
471
+ "lstrip": false,
472
+ "normalized": false,
473
+ "rstrip": false,
474
+ "single_word": false,
475
+ "special": true
476
+ },
477
+ "61": {
478
+ "content": "<|reserved_51|>",
479
+ "lstrip": false,
480
+ "normalized": false,
481
+ "rstrip": false,
482
+ "single_word": false,
483
+ "special": true
484
+ },
485
+ "62": {
486
+ "content": "<|reserved_52|>",
487
+ "lstrip": false,
488
+ "normalized": false,
489
+ "rstrip": false,
490
+ "single_word": false,
491
+ "special": true
492
+ },
493
+ "63": {
494
+ "content": "<|reserved_53|>",
495
+ "lstrip": false,
496
+ "normalized": false,
497
+ "rstrip": false,
498
+ "single_word": false,
499
+ "special": true
500
+ },
501
+ "64": {
502
+ "content": "<|reserved_54|>",
503
+ "lstrip": false,
504
+ "normalized": false,
505
+ "rstrip": false,
506
+ "single_word": false,
507
+ "special": true
508
+ },
509
+ "65": {
510
+ "content": "<|reserved_55|>",
511
+ "lstrip": false,
512
+ "normalized": false,
513
+ "rstrip": false,
514
+ "single_word": false,
515
+ "special": true
516
+ },
517
+ "66": {
518
+ "content": "<|reserved_56|>",
519
+ "lstrip": false,
520
+ "normalized": false,
521
+ "rstrip": false,
522
+ "single_word": false,
523
+ "special": true
524
+ },
525
+ "67": {
526
+ "content": "<|reserved_57|>",
527
+ "lstrip": false,
528
+ "normalized": false,
529
+ "rstrip": false,
530
+ "single_word": false,
531
+ "special": true
532
+ },
533
+ "68": {
534
+ "content": "<|reserved_58|>",
535
+ "lstrip": false,
536
+ "normalized": false,
537
+ "rstrip": false,
538
+ "single_word": false,
539
+ "special": true
540
+ },
541
+ "69": {
542
+ "content": "<|reserved_59|>",
543
+ "lstrip": false,
544
+ "normalized": false,
545
+ "rstrip": false,
546
+ "single_word": false,
547
+ "special": true
548
+ },
549
+ "70": {
550
+ "content": "<|reserved_60|>",
551
+ "lstrip": false,
552
+ "normalized": false,
553
+ "rstrip": false,
554
+ "single_word": false,
555
+ "special": true
556
+ },
557
+ "71": {
558
+ "content": "<|reserved_61|>",
559
+ "lstrip": false,
560
+ "normalized": false,
561
+ "rstrip": false,
562
+ "single_word": false,
563
+ "special": true
564
+ },
565
+ "72": {
566
+ "content": "<|reserved_62|>",
567
+ "lstrip": false,
568
+ "normalized": false,
569
+ "rstrip": false,
570
+ "single_word": false,
571
+ "special": true
572
+ },
573
+ "73": {
574
+ "content": "<|reserved_63|>",
575
+ "lstrip": false,
576
+ "normalized": false,
577
+ "rstrip": false,
578
+ "single_word": false,
579
+ "special": true
580
+ },
581
+ "74": {
582
+ "content": "<|reserved_64|>",
583
+ "lstrip": false,
584
+ "normalized": false,
585
+ "rstrip": false,
586
+ "single_word": false,
587
+ "special": true
588
+ },
589
+ "75": {
590
+ "content": "<|reserved_65|>",
591
+ "lstrip": false,
592
+ "normalized": false,
593
+ "rstrip": false,
594
+ "single_word": false,
595
+ "special": true
596
+ },
597
+ "76": {
598
+ "content": "<|reserved_66|>",
599
+ "lstrip": false,
600
+ "normalized": false,
601
+ "rstrip": false,
602
+ "single_word": false,
603
+ "special": true
604
+ },
605
+ "77": {
606
+ "content": "<|reserved_67|>",
607
+ "lstrip": false,
608
+ "normalized": false,
609
+ "rstrip": false,
610
+ "single_word": false,
611
+ "special": true
612
+ },
613
+ "78": {
614
+ "content": "<|reserved_68|>",
615
+ "lstrip": false,
616
+ "normalized": false,
617
+ "rstrip": false,
618
+ "single_word": false,
619
+ "special": true
620
+ },
621
+ "79": {
622
+ "content": "<|reserved_69|>",
623
+ "lstrip": false,
624
+ "normalized": false,
625
+ "rstrip": false,
626
+ "single_word": false,
627
+ "special": true
628
+ },
629
+ "80": {
630
+ "content": "<|reserved_70|>",
631
+ "lstrip": false,
632
+ "normalized": false,
633
+ "rstrip": false,
634
+ "single_word": false,
635
+ "special": true
636
+ },
637
+ "81": {
638
+ "content": "<|reserved_71|>",
639
+ "lstrip": false,
640
+ "normalized": false,
641
+ "rstrip": false,
642
+ "single_word": false,
643
+ "special": true
644
+ },
645
+ "82": {
646
+ "content": "<|reserved_72|>",
647
+ "lstrip": false,
648
+ "normalized": false,
649
+ "rstrip": false,
650
+ "single_word": false,
651
+ "special": true
652
+ },
653
+ "83": {
654
+ "content": "<|reserved_73|>",
655
+ "lstrip": false,
656
+ "normalized": false,
657
+ "rstrip": false,
658
+ "single_word": false,
659
+ "special": true
660
+ },
661
+ "84": {
662
+ "content": "<|reserved_74|>",
663
+ "lstrip": false,
664
+ "normalized": false,
665
+ "rstrip": false,
666
+ "single_word": false,
667
+ "special": true
668
+ },
669
+ "85": {
670
+ "content": "<|reserved_75|>",
671
+ "lstrip": false,
672
+ "normalized": false,
673
+ "rstrip": false,
674
+ "single_word": false,
675
+ "special": true
676
+ },
677
+ "86": {
678
+ "content": "<|reserved_76|>",
679
+ "lstrip": false,
680
+ "normalized": false,
681
+ "rstrip": false,
682
+ "single_word": false,
683
+ "special": true
684
+ },
685
+ "87": {
686
+ "content": "<|reserved_77|>",
687
+ "lstrip": false,
688
+ "normalized": false,
689
+ "rstrip": false,
690
+ "single_word": false,
691
+ "special": true
692
+ },
693
+ "88": {
694
+ "content": "<|reserved_78|>",
695
+ "lstrip": false,
696
+ "normalized": false,
697
+ "rstrip": false,
698
+ "single_word": false,
699
+ "special": true
700
+ },
701
+ "89": {
702
+ "content": "<|reserved_79|>",
703
+ "lstrip": false,
704
+ "normalized": false,
705
+ "rstrip": false,
706
+ "single_word": false,
707
+ "special": true
708
+ },
709
+ "90": {
710
+ "content": "<|reserved_80|>",
711
+ "lstrip": false,
712
+ "normalized": false,
713
+ "rstrip": false,
714
+ "single_word": false,
715
+ "special": true
716
+ },
717
+ "91": {
718
+ "content": "<|reserved_81|>",
719
+ "lstrip": false,
720
+ "normalized": false,
721
+ "rstrip": false,
722
+ "single_word": false,
723
+ "special": true
724
+ },
725
+ "92": {
726
+ "content": "<|reserved_82|>",
727
+ "lstrip": false,
728
+ "normalized": false,
729
+ "rstrip": false,
730
+ "single_word": false,
731
+ "special": true
732
+ },
733
+ "93": {
734
+ "content": "<|reserved_83|>",
735
+ "lstrip": false,
736
+ "normalized": false,
737
+ "rstrip": false,
738
+ "single_word": false,
739
+ "special": true
740
+ },
741
+ "94": {
742
+ "content": "<|reserved_84|>",
743
+ "lstrip": false,
744
+ "normalized": false,
745
+ "rstrip": false,
746
+ "single_word": false,
747
+ "special": true
748
+ },
749
+ "95": {
750
+ "content": "<|reserved_85|>",
751
+ "lstrip": false,
752
+ "normalized": false,
753
+ "rstrip": false,
754
+ "single_word": false,
755
+ "special": true
756
+ },
757
+ "96": {
758
+ "content": "<|reserved_86|>",
759
+ "lstrip": false,
760
+ "normalized": false,
761
+ "rstrip": false,
762
+ "single_word": false,
763
+ "special": true
764
+ },
765
+ "97": {
766
+ "content": "<|reserved_87|>",
767
+ "lstrip": false,
768
+ "normalized": false,
769
+ "rstrip": false,
770
+ "single_word": false,
771
+ "special": true
772
+ },
773
+ "98": {
774
+ "content": "<|reserved_88|>",
775
+ "lstrip": false,
776
+ "normalized": false,
777
+ "rstrip": false,
778
+ "single_word": false,
779
+ "special": true
780
+ },
781
+ "99": {
782
+ "content": "<|reserved_89|>",
783
+ "lstrip": false,
784
+ "normalized": false,
785
+ "rstrip": false,
786
+ "single_word": false,
787
+ "special": true
788
+ },
789
+ "100": {
790
+ "content": "<|reserved_90|>",
791
+ "lstrip": false,
792
+ "normalized": false,
793
+ "rstrip": false,
794
+ "single_word": false,
795
+ "special": true
796
+ },
797
+ "101": {
798
+ "content": "<|reserved_91|>",
799
+ "lstrip": false,
800
+ "normalized": false,
801
+ "rstrip": false,
802
+ "single_word": false,
803
+ "special": true
804
+ },
805
+ "102": {
806
+ "content": "<|reserved_92|>",
807
+ "lstrip": false,
808
+ "normalized": false,
809
+ "rstrip": false,
810
+ "single_word": false,
811
+ "special": true
812
+ },
813
+ "103": {
814
+ "content": "<|reserved_93|>",
815
+ "lstrip": false,
816
+ "normalized": false,
817
+ "rstrip": false,
818
+ "single_word": false,
819
+ "special": true
820
+ },
821
+ "104": {
822
+ "content": "<|reserved_94|>",
823
+ "lstrip": false,
824
+ "normalized": false,
825
+ "rstrip": false,
826
+ "single_word": false,
827
+ "special": true
828
+ },
829
+ "105": {
830
+ "content": "<|reserved_95|>",
831
+ "lstrip": false,
832
+ "normalized": false,
833
+ "rstrip": false,
834
+ "single_word": false,
835
+ "special": true
836
+ },
837
+ "106": {
838
+ "content": "<|reserved_96|>",
839
+ "lstrip": false,
840
+ "normalized": false,
841
+ "rstrip": false,
842
+ "single_word": false,
843
+ "special": true
844
+ },
845
+ "107": {
846
+ "content": "<|reserved_97|>",
847
+ "lstrip": false,
848
+ "normalized": false,
849
+ "rstrip": false,
850
+ "single_word": false,
851
+ "special": true
852
+ },
853
+ "108": {
854
+ "content": "<|reserved_98|>",
855
+ "lstrip": false,
856
+ "normalized": false,
857
+ "rstrip": false,
858
+ "single_word": false,
859
+ "special": true
860
+ },
861
+ "109": {
862
+ "content": "<|reserved_99|>",
863
+ "lstrip": false,
864
+ "normalized": false,
865
+ "rstrip": false,
866
+ "single_word": false,
867
+ "special": true
868
+ },
869
+ "110": {
870
+ "content": "<|reserved_100|>",
871
+ "lstrip": false,
872
+ "normalized": false,
873
+ "rstrip": false,
874
+ "single_word": false,
875
+ "special": true
876
+ },
877
+ "111": {
878
+ "content": "<|reserved_101|>",
879
+ "lstrip": false,
880
+ "normalized": false,
881
+ "rstrip": false,
882
+ "single_word": false,
883
+ "special": true
884
+ },
885
+ "112": {
886
+ "content": "<|reserved_102|>",
887
+ "lstrip": false,
888
+ "normalized": false,
889
+ "rstrip": false,
890
+ "single_word": false,
891
+ "special": true
892
+ },
893
+ "113": {
894
+ "content": "<|reserved_103|>",
895
+ "lstrip": false,
896
+ "normalized": false,
897
+ "rstrip": false,
898
+ "single_word": false,
899
+ "special": true
900
+ },
901
+ "114": {
902
+ "content": "<|reserved_104|>",
903
+ "lstrip": false,
904
+ "normalized": false,
905
+ "rstrip": false,
906
+ "single_word": false,
907
+ "special": true
908
+ },
909
+ "115": {
910
+ "content": "<|reserved_105|>",
911
+ "lstrip": false,
912
+ "normalized": false,
913
+ "rstrip": false,
914
+ "single_word": false,
915
+ "special": true
916
+ },
917
+ "116": {
918
+ "content": "<|reserved_106|>",
919
+ "lstrip": false,
920
+ "normalized": false,
921
+ "rstrip": false,
922
+ "single_word": false,
923
+ "special": true
924
+ },
925
+ "117": {
926
+ "content": "<|reserved_107|>",
927
+ "lstrip": false,
928
+ "normalized": false,
929
+ "rstrip": false,
930
+ "single_word": false,
931
+ "special": true
932
+ },
933
+ "118": {
934
+ "content": "<|reserved_108|>",
935
+ "lstrip": false,
936
+ "normalized": false,
937
+ "rstrip": false,
938
+ "single_word": false,
939
+ "special": true
940
+ },
941
+ "119": {
942
+ "content": "<|reserved_109|>",
943
+ "lstrip": false,
944
+ "normalized": false,
945
+ "rstrip": false,
946
+ "single_word": false,
947
+ "special": true
948
+ },
949
+ "120": {
950
+ "content": "<|reserved_110|>",
951
+ "lstrip": false,
952
+ "normalized": false,
953
+ "rstrip": false,
954
+ "single_word": false,
955
+ "special": true
956
+ },
957
+ "121": {
958
+ "content": "<|reserved_111|>",
959
+ "lstrip": false,
960
+ "normalized": false,
961
+ "rstrip": false,
962
+ "single_word": false,
963
+ "special": true
964
+ },
965
+ "122": {
966
+ "content": "<|reserved_112|>",
967
+ "lstrip": false,
968
+ "normalized": false,
969
+ "rstrip": false,
970
+ "single_word": false,
971
+ "special": true
972
+ },
973
+ "123": {
974
+ "content": "<|reserved_113|>",
975
+ "lstrip": false,
976
+ "normalized": false,
977
+ "rstrip": false,
978
+ "single_word": false,
979
+ "special": true
980
+ },
981
+ "124": {
982
+ "content": "<|reserved_114|>",
983
+ "lstrip": false,
984
+ "normalized": false,
985
+ "rstrip": false,
986
+ "single_word": false,
987
+ "special": true
988
+ },
989
+ "125": {
990
+ "content": "<|reserved_115|>",
991
+ "lstrip": false,
992
+ "normalized": false,
993
+ "rstrip": false,
994
+ "single_word": false,
995
+ "special": true
996
+ },
997
+ "126": {
998
+ "content": "<|reserved_116|>",
999
+ "lstrip": false,
1000
+ "normalized": false,
1001
+ "rstrip": false,
1002
+ "single_word": false,
1003
+ "special": true
1004
+ },
1005
+ "127": {
1006
+ "content": "<|reserved_117|>",
1007
+ "lstrip": false,
1008
+ "normalized": false,
1009
+ "rstrip": false,
1010
+ "single_word": false,
1011
+ "special": true
1012
+ },
1013
+ "128": {
1014
+ "content": "<|audio_start|>",
1015
+ "lstrip": false,
1016
+ "normalized": false,
1017
+ "rstrip": false,
1018
+ "single_word": false,
1019
+ "special": true
1020
+ },
1021
+ "129": {
1022
+ "content": "<|text_start|>",
1023
+ "lstrip": false,
1024
+ "normalized": false,
1025
+ "rstrip": false,
1026
+ "single_word": false,
1027
+ "special": true
1028
+ },
1029
+ "130": {
1030
+ "content": "<|text_end|>",
1031
+ "lstrip": false,
1032
+ "normalized": false,
1033
+ "rstrip": false,
1034
+ "single_word": false,
1035
+ "special": true
1036
+ },
1037
+ "131": {
1038
+ "content": "<|mixed_start|>",
1039
+ "lstrip": false,
1040
+ "normalized": false,
1041
+ "rstrip": false,
1042
+ "single_word": false,
1043
+ "special": true
1044
+ },
1045
+ "132": {
1046
+ "content": "<|mixed_end|>",
1047
+ "lstrip": false,
1048
+ "normalized": false,
1049
+ "rstrip": false,
1050
+ "single_word": false,
1051
+ "special": true
1052
+ },
1053
+ "133": {
1054
+ "content": "<|reserved_123|>",
1055
+ "lstrip": false,
1056
+ "normalized": false,
1057
+ "rstrip": false,
1058
+ "single_word": false,
1059
+ "special": true
1060
+ },
1061
+ "134": {
1062
+ "content": "<|reserved_124|>",
1063
+ "lstrip": false,
1064
+ "normalized": false,
1065
+ "rstrip": false,
1066
+ "single_word": false,
1067
+ "special": true
1068
+ },
1069
+ "135": {
1070
+ "content": "<|reserved_125|>",
1071
+ "lstrip": false,
1072
+ "normalized": false,
1073
+ "rstrip": false,
1074
+ "single_word": false,
1075
+ "special": true
1076
+ },
1077
+ "136": {
1078
+ "content": "<|reserved_126|>",
1079
+ "lstrip": false,
1080
+ "normalized": false,
1081
+ "rstrip": false,
1082
+ "single_word": false,
1083
+ "special": true
1084
+ },
1085
+ "137": {
1086
+ "content": "<|reserved_127|>",
1087
+ "lstrip": false,
1088
+ "normalized": false,
1089
+ "rstrip": false,
1090
+ "single_word": false,
1091
+ "special": true
1092
+ },
1093
+ "138": {
1094
+ "content": "<|reserved_128|>",
1095
+ "lstrip": false,
1096
+ "normalized": false,
1097
+ "rstrip": false,
1098
+ "single_word": false,
1099
+ "special": true
1100
+ },
1101
+ "139": {
1102
+ "content": "<|reserved_129|>",
1103
+ "lstrip": false,
1104
+ "normalized": false,
1105
+ "rstrip": false,
1106
+ "single_word": false,
1107
+ "special": true
1108
+ },
1109
+ "140": {
1110
+ "content": "<|reserved_130|>",
1111
+ "lstrip": false,
1112
+ "normalized": false,
1113
+ "rstrip": false,
1114
+ "single_word": false,
1115
+ "special": true
1116
+ },
1117
+ "141": {
1118
+ "content": "<|reserved_131|>",
1119
+ "lstrip": false,
1120
+ "normalized": false,
1121
+ "rstrip": false,
1122
+ "single_word": false,
1123
+ "special": true
1124
+ },
1125
+ "142": {
1126
+ "content": "<|reserved_132|>",
1127
+ "lstrip": false,
1128
+ "normalized": false,
1129
+ "rstrip": false,
1130
+ "single_word": false,
1131
+ "special": true
1132
+ },
1133
+ "143": {
1134
+ "content": "<|reserved_133|>",
1135
+ "lstrip": false,
1136
+ "normalized": false,
1137
+ "rstrip": false,
1138
+ "single_word": false,
1139
+ "special": true
1140
+ },
1141
+ "144": {
1142
+ "content": "<|reserved_134|>",
1143
+ "lstrip": false,
1144
+ "normalized": false,
1145
+ "rstrip": false,
1146
+ "single_word": false,
1147
+ "special": true
1148
+ },
1149
+ "145": {
1150
+ "content": "<|reserved_135|>",
1151
+ "lstrip": false,
1152
+ "normalized": false,
1153
+ "rstrip": false,
1154
+ "single_word": false,
1155
+ "special": true
1156
+ },
1157
+ "146": {
1158
+ "content": "<|reserved_136|>",
1159
+ "lstrip": false,
1160
+ "normalized": false,
1161
+ "rstrip": false,
1162
+ "single_word": false,
1163
+ "special": true
1164
+ },
1165
+ "147": {
1166
+ "content": "<|reserved_137|>",
1167
+ "lstrip": false,
1168
+ "normalized": false,
1169
+ "rstrip": false,
1170
+ "single_word": false,
1171
+ "special": true
1172
+ },
1173
+ "148": {
1174
+ "content": "<|reserved_138|>",
1175
+ "lstrip": false,
1176
+ "normalized": false,
1177
+ "rstrip": false,
1178
+ "single_word": false,
1179
+ "special": true
1180
+ },
1181
+ "149": {
1182
+ "content": "<|reserved_139|>",
1183
+ "lstrip": false,
1184
+ "normalized": false,
1185
+ "rstrip": false,
1186
+ "single_word": false,
1187
+ "special": true
1188
+ },
1189
+ "150": {
1190
+ "content": "<|reserved_140|>",
1191
+ "lstrip": false,
1192
+ "normalized": false,
1193
+ "rstrip": false,
1194
+ "single_word": false,
1195
+ "special": true
1196
+ },
1197
+ "151": {
1198
+ "content": "<|reserved_141|>",
1199
+ "lstrip": false,
1200
+ "normalized": false,
1201
+ "rstrip": false,
1202
+ "single_word": false,
1203
+ "special": true
1204
+ },
1205
+ "152": {
1206
+ "content": "<|reserved_142|>",
1207
+ "lstrip": false,
1208
+ "normalized": false,
1209
+ "rstrip": false,
1210
+ "single_word": false,
1211
+ "special": true
1212
+ },
1213
+ "153": {
1214
+ "content": "<|reserved_143|>",
1215
+ "lstrip": false,
1216
+ "normalized": false,
1217
+ "rstrip": false,
1218
+ "single_word": false,
1219
+ "special": true
1220
+ },
1221
+ "154": {
1222
+ "content": "<|reserved_144|>",
1223
+ "lstrip": false,
1224
+ "normalized": false,
1225
+ "rstrip": false,
1226
+ "single_word": false,
1227
+ "special": true
1228
+ },
1229
+ "155": {
1230
+ "content": "<|reserved_145|>",
1231
+ "lstrip": false,
1232
+ "normalized": false,
1233
+ "rstrip": false,
1234
+ "single_word": false,
1235
+ "special": true
1236
+ },
1237
+ "156": {
1238
+ "content": "<|reserved_146|>",
1239
+ "lstrip": false,
1240
+ "normalized": false,
1241
+ "rstrip": false,
1242
+ "single_word": false,
1243
+ "special": true
1244
+ },
1245
+ "157": {
1246
+ "content": "<|reserved_147|>",
1247
+ "lstrip": false,
1248
+ "normalized": false,
1249
+ "rstrip": false,
1250
+ "single_word": false,
1251
+ "special": true
1252
+ },
1253
+ "158": {
1254
+ "content": "<|reserved_148|>",
1255
+ "lstrip": false,
1256
+ "normalized": false,
1257
+ "rstrip": false,
1258
+ "single_word": false,
1259
+ "special": true
1260
+ },
1261
+ "159": {
1262
+ "content": "<|reserved_149|>",
1263
+ "lstrip": false,
1264
+ "normalized": false,
1265
+ "rstrip": false,
1266
+ "single_word": false,
1267
+ "special": true
1268
+ },
1269
+ "160": {
1270
+ "content": "<|reserved_150|>",
1271
+ "lstrip": false,
1272
+ "normalized": false,
1273
+ "rstrip": false,
1274
+ "single_word": false,
1275
+ "special": true
1276
+ },
1277
+ "161": {
1278
+ "content": "<|reserved_151|>",
1279
+ "lstrip": false,
1280
+ "normalized": false,
1281
+ "rstrip": false,
1282
+ "single_word": false,
1283
+ "special": true
1284
+ },
1285
+ "162": {
1286
+ "content": "<|reserved_152|>",
1287
+ "lstrip": false,
1288
+ "normalized": false,
1289
+ "rstrip": false,
1290
+ "single_word": false,
1291
+ "special": true
1292
+ },
1293
+ "163": {
1294
+ "content": "<|reserved_153|>",
1295
+ "lstrip": false,
1296
+ "normalized": false,
1297
+ "rstrip": false,
1298
+ "single_word": false,
1299
+ "special": true
1300
+ },
1301
+ "164": {
1302
+ "content": "<|reserved_154|>",
1303
+ "lstrip": false,
1304
+ "normalized": false,
1305
+ "rstrip": false,
1306
+ "single_word": false,
1307
+ "special": true
1308
+ },
1309
+ "165": {
1310
+ "content": "<|reserved_155|>",
1311
+ "lstrip": false,
1312
+ "normalized": false,
1313
+ "rstrip": false,
1314
+ "single_word": false,
1315
+ "special": true
1316
+ },
1317
+ "166": {
1318
+ "content": "<|reserved_156|>",
1319
+ "lstrip": false,
1320
+ "normalized": false,
1321
+ "rstrip": false,
1322
+ "single_word": false,
1323
+ "special": true
1324
+ },
1325
+ "167": {
1326
+ "content": "<|reserved_157|>",
1327
+ "lstrip": false,
1328
+ "normalized": false,
1329
+ "rstrip": false,
1330
+ "single_word": false,
1331
+ "special": true
1332
+ },
1333
+ "168": {
1334
+ "content": "<|reserved_158|>",
1335
+ "lstrip": false,
1336
+ "normalized": false,
1337
+ "rstrip": false,
1338
+ "single_word": false,
1339
+ "special": true
1340
+ },
1341
+ "169": {
1342
+ "content": "<|reserved_159|>",
1343
+ "lstrip": false,
1344
+ "normalized": false,
1345
+ "rstrip": false,
1346
+ "single_word": false,
1347
+ "special": true
1348
+ },
1349
+ "170": {
1350
+ "content": "<|reserved_160|>",
1351
+ "lstrip": false,
1352
+ "normalized": false,
1353
+ "rstrip": false,
1354
+ "single_word": false,
1355
+ "special": true
1356
+ },
1357
+ "171": {
1358
+ "content": "<|reserved_161|>",
1359
+ "lstrip": false,
1360
+ "normalized": false,
1361
+ "rstrip": false,
1362
+ "single_word": false,
1363
+ "special": true
1364
+ },
1365
+ "172": {
1366
+ "content": "<|reserved_162|>",
1367
+ "lstrip": false,
1368
+ "normalized": false,
1369
+ "rstrip": false,
1370
+ "single_word": false,
1371
+ "special": true
1372
+ },
1373
+ "173": {
1374
+ "content": "<|reserved_163|>",
1375
+ "lstrip": false,
1376
+ "normalized": false,
1377
+ "rstrip": false,
1378
+ "single_word": false,
1379
+ "special": true
1380
+ },
1381
+ "174": {
1382
+ "content": "<|reserved_164|>",
1383
+ "lstrip": false,
1384
+ "normalized": false,
1385
+ "rstrip": false,
1386
+ "single_word": false,
1387
+ "special": true
1388
+ },
1389
+ "175": {
1390
+ "content": "<|reserved_165|>",
1391
+ "lstrip": false,
1392
+ "normalized": false,
1393
+ "rstrip": false,
1394
+ "single_word": false,
1395
+ "special": true
1396
+ },
1397
+ "176": {
1398
+ "content": "<|reserved_166|>",
1399
+ "lstrip": false,
1400
+ "normalized": false,
1401
+ "rstrip": false,
1402
+ "single_word": false,
1403
+ "special": true
1404
+ },
1405
+ "177": {
1406
+ "content": "<|reserved_167|>",
1407
+ "lstrip": false,
1408
+ "normalized": false,
1409
+ "rstrip": false,
1410
+ "single_word": false,
1411
+ "special": true
1412
+ },
1413
+ "178": {
1414
+ "content": "<|reserved_168|>",
1415
+ "lstrip": false,
1416
+ "normalized": false,
1417
+ "rstrip": false,
1418
+ "single_word": false,
1419
+ "special": true
1420
+ },
1421
+ "179": {
1422
+ "content": "<|reserved_169|>",
1423
+ "lstrip": false,
1424
+ "normalized": false,
1425
+ "rstrip": false,
1426
+ "single_word": false,
1427
+ "special": true
1428
+ },
1429
+ "180": {
1430
+ "content": "<|reserved_170|>",
1431
+ "lstrip": false,
1432
+ "normalized": false,
1433
+ "rstrip": false,
1434
+ "single_word": false,
1435
+ "special": true
1436
+ },
1437
+ "181": {
1438
+ "content": "<|reserved_171|>",
1439
+ "lstrip": false,
1440
+ "normalized": false,
1441
+ "rstrip": false,
1442
+ "single_word": false,
1443
+ "special": true
1444
+ },
1445
+ "182": {
1446
+ "content": "<|reserved_172|>",
1447
+ "lstrip": false,
1448
+ "normalized": false,
1449
+ "rstrip": false,
1450
+ "single_word": false,
1451
+ "special": true
1452
+ },
1453
+ "183": {
1454
+ "content": "<|reserved_173|>",
1455
+ "lstrip": false,
1456
+ "normalized": false,
1457
+ "rstrip": false,
1458
+ "single_word": false,
1459
+ "special": true
1460
+ },
1461
+ "184": {
1462
+ "content": "<|reserved_174|>",
1463
+ "lstrip": false,
1464
+ "normalized": false,
1465
+ "rstrip": false,
1466
+ "single_word": false,
1467
+ "special": true
1468
+ },
1469
+ "185": {
1470
+ "content": "<|reserved_175|>",
1471
+ "lstrip": false,
1472
+ "normalized": false,
1473
+ "rstrip": false,
1474
+ "single_word": false,
1475
+ "special": true
1476
+ },
1477
+ "186": {
1478
+ "content": "<|reserved_176|>",
1479
+ "lstrip": false,
1480
+ "normalized": false,
1481
+ "rstrip": false,
1482
+ "single_word": false,
1483
+ "special": true
1484
+ },
1485
+ "187": {
1486
+ "content": "<|reserved_177|>",
1487
+ "lstrip": false,
1488
+ "normalized": false,
1489
+ "rstrip": false,
1490
+ "single_word": false,
1491
+ "special": true
1492
+ },
1493
+ "188": {
1494
+ "content": "<|reserved_178|>",
1495
+ "lstrip": false,
1496
+ "normalized": false,
1497
+ "rstrip": false,
1498
+ "single_word": false,
1499
+ "special": true
1500
+ },
1501
+ "189": {
1502
+ "content": "<|reserved_179|>",
1503
+ "lstrip": false,
1504
+ "normalized": false,
1505
+ "rstrip": false,
1506
+ "single_word": false,
1507
+ "special": true
1508
+ },
1509
+ "190": {
1510
+ "content": "<|reserved_180|>",
1511
+ "lstrip": false,
1512
+ "normalized": false,
1513
+ "rstrip": false,
1514
+ "single_word": false,
1515
+ "special": true
1516
+ },
1517
+ "191": {
1518
+ "content": "<|reserved_181|>",
1519
+ "lstrip": false,
1520
+ "normalized": false,
1521
+ "rstrip": false,
1522
+ "single_word": false,
1523
+ "special": true
1524
+ },
1525
+ "192": {
1526
+ "content": "<|reserved_182|>",
1527
+ "lstrip": false,
1528
+ "normalized": false,
1529
+ "rstrip": false,
1530
+ "single_word": false,
1531
+ "special": true
1532
+ },
1533
+ "193": {
1534
+ "content": "<|reserved_183|>",
1535
+ "lstrip": false,
1536
+ "normalized": false,
1537
+ "rstrip": false,
1538
+ "single_word": false,
1539
+ "special": true
1540
+ },
1541
+ "194": {
1542
+ "content": "<|reserved_184|>",
1543
+ "lstrip": false,
1544
+ "normalized": false,
1545
+ "rstrip": false,
1546
+ "single_word": false,
1547
+ "special": true
1548
+ },
1549
+ "195": {
1550
+ "content": "<|reserved_185|>",
1551
+ "lstrip": false,
1552
+ "normalized": false,
1553
+ "rstrip": false,
1554
+ "single_word": false,
1555
+ "special": true
1556
+ },
1557
+ "196": {
1558
+ "content": "<|reserved_186|>",
1559
+ "lstrip": false,
1560
+ "normalized": false,
1561
+ "rstrip": false,
1562
+ "single_word": false,
1563
+ "special": true
1564
+ },
1565
+ "197": {
1566
+ "content": "<|reserved_187|>",
1567
+ "lstrip": false,
1568
+ "normalized": false,
1569
+ "rstrip": false,
1570
+ "single_word": false,
1571
+ "special": true
1572
+ },
1573
+ "198": {
1574
+ "content": "<|reserved_188|>",
1575
+ "lstrip": false,
1576
+ "normalized": false,
1577
+ "rstrip": false,
1578
+ "single_word": false,
1579
+ "special": true
1580
+ },
1581
+ "199": {
1582
+ "content": "<|reserved_189|>",
1583
+ "lstrip": false,
1584
+ "normalized": false,
1585
+ "rstrip": false,
1586
+ "single_word": false,
1587
+ "special": true
1588
+ },
1589
+ "200": {
1590
+ "content": "<|reserved_190|>",
1591
+ "lstrip": false,
1592
+ "normalized": false,
1593
+ "rstrip": false,
1594
+ "single_word": false,
1595
+ "special": true
1596
+ },
1597
+ "201": {
1598
+ "content": "<|reserved_191|>",
1599
+ "lstrip": false,
1600
+ "normalized": false,
1601
+ "rstrip": false,
1602
+ "single_word": false,
1603
+ "special": true
1604
+ },
1605
+ "202": {
1606
+ "content": "<|reserved_192|>",
1607
+ "lstrip": false,
1608
+ "normalized": false,
1609
+ "rstrip": false,
1610
+ "single_word": false,
1611
+ "special": true
1612
+ },
1613
+ "203": {
1614
+ "content": "<|reserved_193|>",
1615
+ "lstrip": false,
1616
+ "normalized": false,
1617
+ "rstrip": false,
1618
+ "single_word": false,
1619
+ "special": true
1620
+ },
1621
+ "204": {
1622
+ "content": "<|reserved_194|>",
1623
+ "lstrip": false,
1624
+ "normalized": false,
1625
+ "rstrip": false,
1626
+ "single_word": false,
1627
+ "special": true
1628
+ },
1629
+ "205": {
1630
+ "content": "<|reserved_195|>",
1631
+ "lstrip": false,
1632
+ "normalized": false,
1633
+ "rstrip": false,
1634
+ "single_word": false,
1635
+ "special": true
1636
+ },
1637
+ "206": {
1638
+ "content": "<|reserved_196|>",
1639
+ "lstrip": false,
1640
+ "normalized": false,
1641
+ "rstrip": false,
1642
+ "single_word": false,
1643
+ "special": true
1644
+ },
1645
+ "207": {
1646
+ "content": "<|reserved_197|>",
1647
+ "lstrip": false,
1648
+ "normalized": false,
1649
+ "rstrip": false,
1650
+ "single_word": false,
1651
+ "special": true
1652
+ },
1653
+ "208": {
1654
+ "content": "<|reserved_198|>",
1655
+ "lstrip": false,
1656
+ "normalized": false,
1657
+ "rstrip": false,
1658
+ "single_word": false,
1659
+ "special": true
1660
+ },
1661
+ "209": {
1662
+ "content": "<|reserved_199|>",
1663
+ "lstrip": false,
1664
+ "normalized": false,
1665
+ "rstrip": false,
1666
+ "single_word": false,
1667
+ "special": true
1668
+ },
1669
+ "210": {
1670
+ "content": "<|reserved_200|>",
1671
+ "lstrip": false,
1672
+ "normalized": false,
1673
+ "rstrip": false,
1674
+ "single_word": false,
1675
+ "special": true
1676
+ },
1677
+ "211": {
1678
+ "content": "<|reserved_201|>",
1679
+ "lstrip": false,
1680
+ "normalized": false,
1681
+ "rstrip": false,
1682
+ "single_word": false,
1683
+ "special": true
1684
+ },
1685
+ "212": {
1686
+ "content": "<|reserved_202|>",
1687
+ "lstrip": false,
1688
+ "normalized": false,
1689
+ "rstrip": false,
1690
+ "single_word": false,
1691
+ "special": true
1692
+ },
1693
+ "213": {
1694
+ "content": "<|reserved_203|>",
1695
+ "lstrip": false,
1696
+ "normalized": false,
1697
+ "rstrip": false,
1698
+ "single_word": false,
1699
+ "special": true
1700
+ },
1701
+ "214": {
1702
+ "content": "<|reserved_204|>",
1703
+ "lstrip": false,
1704
+ "normalized": false,
1705
+ "rstrip": false,
1706
+ "single_word": false,
1707
+ "special": true
1708
+ },
1709
+ "215": {
1710
+ "content": "<|reserved_205|>",
1711
+ "lstrip": false,
1712
+ "normalized": false,
1713
+ "rstrip": false,
1714
+ "single_word": false,
1715
+ "special": true
1716
+ },
1717
+ "216": {
1718
+ "content": "<|reserved_206|>",
1719
+ "lstrip": false,
1720
+ "normalized": false,
1721
+ "rstrip": false,
1722
+ "single_word": false,
1723
+ "special": true
1724
+ },
1725
+ "217": {
1726
+ "content": "<|reserved_207|>",
1727
+ "lstrip": false,
1728
+ "normalized": false,
1729
+ "rstrip": false,
1730
+ "single_word": false,
1731
+ "special": true
1732
+ },
1733
+ "218": {
1734
+ "content": "<|reserved_208|>",
1735
+ "lstrip": false,
1736
+ "normalized": false,
1737
+ "rstrip": false,
1738
+ "single_word": false,
1739
+ "special": true
1740
+ },
1741
+ "219": {
1742
+ "content": "<|reserved_209|>",
1743
+ "lstrip": false,
1744
+ "normalized": false,
1745
+ "rstrip": false,
1746
+ "single_word": false,
1747
+ "special": true
1748
+ },
1749
+ "220": {
1750
+ "content": "<|reserved_210|>",
1751
+ "lstrip": false,
1752
+ "normalized": false,
1753
+ "rstrip": false,
1754
+ "single_word": false,
1755
+ "special": true
1756
+ },
1757
+ "221": {
1758
+ "content": "<|reserved_211|>",
1759
+ "lstrip": false,
1760
+ "normalized": false,
1761
+ "rstrip": false,
1762
+ "single_word": false,
1763
+ "special": true
1764
+ },
1765
+ "222": {
1766
+ "content": "<|reserved_212|>",
1767
+ "lstrip": false,
1768
+ "normalized": false,
1769
+ "rstrip": false,
1770
+ "single_word": false,
1771
+ "special": true
1772
+ },
1773
+ "223": {
1774
+ "content": "<|reserved_213|>",
1775
+ "lstrip": false,
1776
+ "normalized": false,
1777
+ "rstrip": false,
1778
+ "single_word": false,
1779
+ "special": true
1780
+ },
1781
+ "224": {
1782
+ "content": "<|reserved_214|>",
1783
+ "lstrip": false,
1784
+ "normalized": false,
1785
+ "rstrip": false,
1786
+ "single_word": false,
1787
+ "special": true
1788
+ },
1789
+ "225": {
1790
+ "content": "<|reserved_215|>",
1791
+ "lstrip": false,
1792
+ "normalized": false,
1793
+ "rstrip": false,
1794
+ "single_word": false,
1795
+ "special": true
1796
+ },
1797
+ "226": {
1798
+ "content": "<|reserved_216|>",
1799
+ "lstrip": false,
1800
+ "normalized": false,
1801
+ "rstrip": false,
1802
+ "single_word": false,
1803
+ "special": true
1804
+ },
1805
+ "227": {
1806
+ "content": "<|reserved_217|>",
1807
+ "lstrip": false,
1808
+ "normalized": false,
1809
+ "rstrip": false,
1810
+ "single_word": false,
1811
+ "special": true
1812
+ },
1813
+ "228": {
1814
+ "content": "<|reserved_218|>",
1815
+ "lstrip": false,
1816
+ "normalized": false,
1817
+ "rstrip": false,
1818
+ "single_word": false,
1819
+ "special": true
1820
+ },
1821
+ "229": {
1822
+ "content": "<|reserved_219|>",
1823
+ "lstrip": false,
1824
+ "normalized": false,
1825
+ "rstrip": false,
1826
+ "single_word": false,
1827
+ "special": true
1828
+ },
1829
+ "230": {
1830
+ "content": "<|reserved_220|>",
1831
+ "lstrip": false,
1832
+ "normalized": false,
1833
+ "rstrip": false,
1834
+ "single_word": false,
1835
+ "special": true
1836
+ },
1837
+ "231": {
1838
+ "content": "<|reserved_221|>",
1839
+ "lstrip": false,
1840
+ "normalized": false,
1841
+ "rstrip": false,
1842
+ "single_word": false,
1843
+ "special": true
1844
+ },
1845
+ "232": {
1846
+ "content": "<|reserved_222|>",
1847
+ "lstrip": false,
1848
+ "normalized": false,
1849
+ "rstrip": false,
1850
+ "single_word": false,
1851
+ "special": true
1852
+ },
1853
+ "233": {
1854
+ "content": "<|reserved_223|>",
1855
+ "lstrip": false,
1856
+ "normalized": false,
1857
+ "rstrip": false,
1858
+ "single_word": false,
1859
+ "special": true
1860
+ },
1861
+ "234": {
1862
+ "content": "<|reserved_224|>",
1863
+ "lstrip": false,
1864
+ "normalized": false,
1865
+ "rstrip": false,
1866
+ "single_word": false,
1867
+ "special": true
1868
+ },
1869
+ "235": {
1870
+ "content": "<|reserved_225|>",
1871
+ "lstrip": false,
1872
+ "normalized": false,
1873
+ "rstrip": false,
1874
+ "single_word": false,
1875
+ "special": true
1876
+ },
1877
+ "236": {
1878
+ "content": "<|reserved_226|>",
1879
+ "lstrip": false,
1880
+ "normalized": false,
1881
+ "rstrip": false,
1882
+ "single_word": false,
1883
+ "special": true
1884
+ },
1885
+ "237": {
1886
+ "content": "<|reserved_227|>",
1887
+ "lstrip": false,
1888
+ "normalized": false,
1889
+ "rstrip": false,
1890
+ "single_word": false,
1891
+ "special": true
1892
+ },
1893
+ "238": {
1894
+ "content": "<|reserved_228|>",
1895
+ "lstrip": false,
1896
+ "normalized": false,
1897
+ "rstrip": false,
1898
+ "single_word": false,
1899
+ "special": true
1900
+ },
1901
+ "239": {
1902
+ "content": "<|reserved_229|>",
1903
+ "lstrip": false,
1904
+ "normalized": false,
1905
+ "rstrip": false,
1906
+ "single_word": false,
1907
+ "special": true
1908
+ },
1909
+ "240": {
1910
+ "content": "<|reserved_230|>",
1911
+ "lstrip": false,
1912
+ "normalized": false,
1913
+ "rstrip": false,
1914
+ "single_word": false,
1915
+ "special": true
1916
+ },
1917
+ "241": {
1918
+ "content": "<|reserved_231|>",
1919
+ "lstrip": false,
1920
+ "normalized": false,
1921
+ "rstrip": false,
1922
+ "single_word": false,
1923
+ "special": true
1924
+ },
1925
+ "242": {
1926
+ "content": "<|reserved_232|>",
1927
+ "lstrip": false,
1928
+ "normalized": false,
1929
+ "rstrip": false,
1930
+ "single_word": false,
1931
+ "special": true
1932
+ },
1933
+ "243": {
1934
+ "content": "<|reserved_233|>",
1935
+ "lstrip": false,
1936
+ "normalized": false,
1937
+ "rstrip": false,
1938
+ "single_word": false,
1939
+ "special": true
1940
+ },
1941
+ "244": {
1942
+ "content": "<|reserved_234|>",
1943
+ "lstrip": false,
1944
+ "normalized": false,
1945
+ "rstrip": false,
1946
+ "single_word": false,
1947
+ "special": true
1948
+ },
1949
+ "245": {
1950
+ "content": "<|reserved_235|>",
1951
+ "lstrip": false,
1952
+ "normalized": false,
1953
+ "rstrip": false,
1954
+ "single_word": false,
1955
+ "special": true
1956
+ },
1957
+ "246": {
1958
+ "content": "<|reserved_236|>",
1959
+ "lstrip": false,
1960
+ "normalized": false,
1961
+ "rstrip": false,
1962
+ "single_word": false,
1963
+ "special": true
1964
+ },
1965
+ "247": {
1966
+ "content": "<|reserved_237|>",
1967
+ "lstrip": false,
1968
+ "normalized": false,
1969
+ "rstrip": false,
1970
+ "single_word": false,
1971
+ "special": true
1972
+ },
1973
+ "248": {
1974
+ "content": "<|reserved_238|>",
1975
+ "lstrip": false,
1976
+ "normalized": false,
1977
+ "rstrip": false,
1978
+ "single_word": false,
1979
+ "special": true
1980
+ },
1981
+ "249": {
1982
+ "content": "<|reserved_239|>",
1983
+ "lstrip": false,
1984
+ "normalized": false,
1985
+ "rstrip": false,
1986
+ "single_word": false,
1987
+ "special": true
1988
+ },
1989
+ "250": {
1990
+ "content": "<|reserved_240|>",
1991
+ "lstrip": false,
1992
+ "normalized": false,
1993
+ "rstrip": false,
1994
+ "single_word": false,
1995
+ "special": true
1996
+ },
1997
+ "251": {
1998
+ "content": "<|reserved_241|>",
1999
+ "lstrip": false,
2000
+ "normalized": false,
2001
+ "rstrip": false,
2002
+ "single_word": false,
2003
+ "special": true
2004
+ },
2005
+ "252": {
2006
+ "content": "<|reserved_242|>",
2007
+ "lstrip": false,
2008
+ "normalized": false,
2009
+ "rstrip": false,
2010
+ "single_word": false,
2011
+ "special": true
2012
+ },
2013
+ "253": {
2014
+ "content": "<|reserved_243|>",
2015
+ "lstrip": false,
2016
+ "normalized": false,
2017
+ "rstrip": false,
2018
+ "single_word": false,
2019
+ "special": true
2020
+ },
2021
+ "254": {
2022
+ "content": "<|reserved_244|>",
2023
+ "lstrip": false,
2024
+ "normalized": false,
2025
+ "rstrip": false,
2026
+ "single_word": false,
2027
+ "special": true
2028
+ },
2029
+ "255": {
2030
+ "content": "<|reserved_245|>",
2031
+ "lstrip": false,
2032
+ "normalized": false,
2033
+ "rstrip": false,
2034
+ "single_word": false,
2035
+ "special": true
2036
+ },
2037
+ "256": {
2038
+ "content": "<|reserved_246|>",
2039
+ "lstrip": false,
2040
+ "normalized": false,
2041
+ "rstrip": false,
2042
+ "single_word": false,
2043
+ "special": true
2044
+ },
2045
+ "257": {
2046
+ "content": "<|reserved_247|>",
2047
+ "lstrip": false,
2048
+ "normalized": false,
2049
+ "rstrip": false,
2050
+ "single_word": false,
2051
+ "special": true
2052
+ },
2053
+ "258": {
2054
+ "content": "<|reserved_248|>",
2055
+ "lstrip": false,
2056
+ "normalized": false,
2057
+ "rstrip": false,
2058
+ "single_word": false,
2059
+ "special": true
2060
+ },
2061
+ "259": {
2062
+ "content": "<|reserved_249|>",
2063
+ "lstrip": false,
2064
+ "normalized": false,
2065
+ "rstrip": false,
2066
+ "single_word": false,
2067
+ "special": true
2068
+ },
2069
+ "260": {
2070
+ "content": "<|reserved_250|>",
2071
+ "lstrip": false,
2072
+ "normalized": false,
2073
+ "rstrip": false,
2074
+ "single_word": false,
2075
+ "special": true
2076
+ },
2077
+ "261": {
2078
+ "content": "<|reserved_251|>",
2079
+ "lstrip": false,
2080
+ "normalized": false,
2081
+ "rstrip": false,
2082
+ "single_word": false,
2083
+ "special": true
2084
+ },
2085
+ "262": {
2086
+ "content": "<|reserved_252|>",
2087
+ "lstrip": false,
2088
+ "normalized": false,
2089
+ "rstrip": false,
2090
+ "single_word": false,
2091
+ "special": true
2092
+ },
2093
+ "263": {
2094
+ "content": "<|reserved_253|>",
2095
+ "lstrip": false,
2096
+ "normalized": false,
2097
+ "rstrip": false,
2098
+ "single_word": false,
2099
+ "special": true
2100
+ },
2101
+ "264": {
2102
+ "content": "<|reserved_254|>",
2103
+ "lstrip": false,
2104
+ "normalized": false,
2105
+ "rstrip": false,
2106
+ "single_word": false,
2107
+ "special": true
2108
+ },
2109
+ "265": {
2110
+ "content": "<|reserved_255|>",
2111
+ "lstrip": false,
2112
+ "normalized": false,
2113
+ "rstrip": false,
2114
+ "single_word": false,
2115
+ "special": true
2116
+ },
2117
+ "266": {
2118
+ "content": "<|reserved_256|>",
2119
+ "lstrip": false,
2120
+ "normalized": false,
2121
+ "rstrip": false,
2122
+ "single_word": false,
2123
+ "special": true
2124
+ },
2125
+ "267": {
2126
+ "content": "<|reserved_257|>",
2127
+ "lstrip": false,
2128
+ "normalized": false,
2129
+ "rstrip": false,
2130
+ "single_word": false,
2131
+ "special": true
2132
+ },
2133
+ "268": {
2134
+ "content": "<|reserved_258|>",
2135
+ "lstrip": false,
2136
+ "normalized": false,
2137
+ "rstrip": false,
2138
+ "single_word": false,
2139
+ "special": true
2140
+ },
2141
+ "269": {
2142
+ "content": "<|reserved_259|>",
2143
+ "lstrip": false,
2144
+ "normalized": false,
2145
+ "rstrip": false,
2146
+ "single_word": false,
2147
+ "special": true
2148
+ },
2149
+ "270": {
2150
+ "content": "<|reserved_260|>",
2151
+ "lstrip": false,
2152
+ "normalized": false,
2153
+ "rstrip": false,
2154
+ "single_word": false,
2155
+ "special": true
2156
+ },
2157
+ "271": {
2158
+ "content": "<|reserved_261|>",
2159
+ "lstrip": false,
2160
+ "normalized": false,
2161
+ "rstrip": false,
2162
+ "single_word": false,
2163
+ "special": true
2164
+ },
2165
+ "272": {
2166
+ "content": "<|reserved_262|>",
2167
+ "lstrip": false,
2168
+ "normalized": false,
2169
+ "rstrip": false,
2170
+ "single_word": false,
2171
+ "special": true
2172
+ },
2173
+ "273": {
2174
+ "content": "<|reserved_263|>",
2175
+ "lstrip": false,
2176
+ "normalized": false,
2177
+ "rstrip": false,
2178
+ "single_word": false,
2179
+ "special": true
2180
+ },
2181
+ "274": {
2182
+ "content": "<|reserved_264|>",
2183
+ "lstrip": false,
2184
+ "normalized": false,
2185
+ "rstrip": false,
2186
+ "single_word": false,
2187
+ "special": true
2188
+ },
2189
+ "275": {
2190
+ "content": "<|reserved_265|>",
2191
+ "lstrip": false,
2192
+ "normalized": false,
2193
+ "rstrip": false,
2194
+ "single_word": false,
2195
+ "special": true
2196
+ },
2197
+ "276": {
2198
+ "content": "<|reserved_266|>",
2199
+ "lstrip": false,
2200
+ "normalized": false,
2201
+ "rstrip": false,
2202
+ "single_word": false,
2203
+ "special": true
2204
+ },
2205
+ "277": {
2206
+ "content": "<|reserved_267|>",
2207
+ "lstrip": false,
2208
+ "normalized": false,
2209
+ "rstrip": false,
2210
+ "single_word": false,
2211
+ "special": true
2212
+ },
2213
+ "278": {
2214
+ "content": "<|reserved_268|>",
2215
+ "lstrip": false,
2216
+ "normalized": false,
2217
+ "rstrip": false,
2218
+ "single_word": false,
2219
+ "special": true
2220
+ },
2221
+ "279": {
2222
+ "content": "<|reserved_269|>",
2223
+ "lstrip": false,
2224
+ "normalized": false,
2225
+ "rstrip": false,
2226
+ "single_word": false,
2227
+ "special": true
2228
+ },
2229
+ "280": {
2230
+ "content": "<|reserved_270|>",
2231
+ "lstrip": false,
2232
+ "normalized": false,
2233
+ "rstrip": false,
2234
+ "single_word": false,
2235
+ "special": true
2236
+ },
2237
+ "281": {
2238
+ "content": "<|reserved_271|>",
2239
+ "lstrip": false,
2240
+ "normalized": false,
2241
+ "rstrip": false,
2242
+ "single_word": false,
2243
+ "special": true
2244
+ },
2245
+ "282": {
2246
+ "content": "<|reserved_272|>",
2247
+ "lstrip": false,
2248
+ "normalized": false,
2249
+ "rstrip": false,
2250
+ "single_word": false,
2251
+ "special": true
2252
+ },
2253
+ "283": {
2254
+ "content": "<|reserved_273|>",
2255
+ "lstrip": false,
2256
+ "normalized": false,
2257
+ "rstrip": false,
2258
+ "single_word": false,
2259
+ "special": true
2260
+ },
2261
+ "284": {
2262
+ "content": "<|reserved_274|>",
2263
+ "lstrip": false,
2264
+ "normalized": false,
2265
+ "rstrip": false,
2266
+ "single_word": false,
2267
+ "special": true
2268
+ },
2269
+ "285": {
2270
+ "content": "<|reserved_275|>",
2271
+ "lstrip": false,
2272
+ "normalized": false,
2273
+ "rstrip": false,
2274
+ "single_word": false,
2275
+ "special": true
2276
+ },
2277
+ "286": {
2278
+ "content": "<|reserved_276|>",
2279
+ "lstrip": false,
2280
+ "normalized": false,
2281
+ "rstrip": false,
2282
+ "single_word": false,
2283
+ "special": true
2284
+ },
2285
+ "287": {
2286
+ "content": "<|reserved_277|>",
2287
+ "lstrip": false,
2288
+ "normalized": false,
2289
+ "rstrip": false,
2290
+ "single_word": false,
2291
+ "special": true
2292
+ },
2293
+ "288": {
2294
+ "content": "<|reserved_278|>",
2295
+ "lstrip": false,
2296
+ "normalized": false,
2297
+ "rstrip": false,
2298
+ "single_word": false,
2299
+ "special": true
2300
+ },
2301
+ "289": {
2302
+ "content": "<|reserved_279|>",
2303
+ "lstrip": false,
2304
+ "normalized": false,
2305
+ "rstrip": false,
2306
+ "single_word": false,
2307
+ "special": true
2308
+ },
2309
+ "290": {
2310
+ "content": "<|reserved_280|>",
2311
+ "lstrip": false,
2312
+ "normalized": false,
2313
+ "rstrip": false,
2314
+ "single_word": false,
2315
+ "special": true
2316
+ },
2317
+ "291": {
2318
+ "content": "<|reserved_281|>",
2319
+ "lstrip": false,
2320
+ "normalized": false,
2321
+ "rstrip": false,
2322
+ "single_word": false,
2323
+ "special": true
2324
+ },
2325
+ "292": {
2326
+ "content": "<|reserved_282|>",
2327
+ "lstrip": false,
2328
+ "normalized": false,
2329
+ "rstrip": false,
2330
+ "single_word": false,
2331
+ "special": true
2332
+ },
2333
+ "293": {
2334
+ "content": "<|reserved_283|>",
2335
+ "lstrip": false,
2336
+ "normalized": false,
2337
+ "rstrip": false,
2338
+ "single_word": false,
2339
+ "special": true
2340
+ },
2341
+ "294": {
2342
+ "content": "<|reserved_284|>",
2343
+ "lstrip": false,
2344
+ "normalized": false,
2345
+ "rstrip": false,
2346
+ "single_word": false,
2347
+ "special": true
2348
+ },
2349
+ "295": {
2350
+ "content": "<|reserved_285|>",
2351
+ "lstrip": false,
2352
+ "normalized": false,
2353
+ "rstrip": false,
2354
+ "single_word": false,
2355
+ "special": true
2356
+ },
2357
+ "296": {
2358
+ "content": "<|reserved_286|>",
2359
+ "lstrip": false,
2360
+ "normalized": false,
2361
+ "rstrip": false,
2362
+ "single_word": false,
2363
+ "special": true
2364
+ },
2365
+ "297": {
2366
+ "content": "<|reserved_287|>",
2367
+ "lstrip": false,
2368
+ "normalized": false,
2369
+ "rstrip": false,
2370
+ "single_word": false,
2371
+ "special": true
2372
+ },
2373
+ "298": {
2374
+ "content": "<|reserved_288|>",
2375
+ "lstrip": false,
2376
+ "normalized": false,
2377
+ "rstrip": false,
2378
+ "single_word": false,
2379
+ "special": true
2380
+ },
2381
+ "299": {
2382
+ "content": "<|reserved_289|>",
2383
+ "lstrip": false,
2384
+ "normalized": false,
2385
+ "rstrip": false,
2386
+ "single_word": false,
2387
+ "special": true
2388
+ },
2389
+ "300": {
2390
+ "content": "<|reserved_290|>",
2391
+ "lstrip": false,
2392
+ "normalized": false,
2393
+ "rstrip": false,
2394
+ "single_word": false,
2395
+ "special": true
2396
+ },
2397
+ "301": {
2398
+ "content": "<|reserved_291|>",
2399
+ "lstrip": false,
2400
+ "normalized": false,
2401
+ "rstrip": false,
2402
+ "single_word": false,
2403
+ "special": true
2404
+ },
2405
+ "302": {
2406
+ "content": "<|reserved_292|>",
2407
+ "lstrip": false,
2408
+ "normalized": false,
2409
+ "rstrip": false,
2410
+ "single_word": false,
2411
+ "special": true
2412
+ },
2413
+ "303": {
2414
+ "content": "<|reserved_293|>",
2415
+ "lstrip": false,
2416
+ "normalized": false,
2417
+ "rstrip": false,
2418
+ "single_word": false,
2419
+ "special": true
2420
+ },
2421
+ "304": {
2422
+ "content": "<|reserved_294|>",
2423
+ "lstrip": false,
2424
+ "normalized": false,
2425
+ "rstrip": false,
2426
+ "single_word": false,
2427
+ "special": true
2428
+ },
2429
+ "305": {
2430
+ "content": "<|reserved_295|>",
2431
+ "lstrip": false,
2432
+ "normalized": false,
2433
+ "rstrip": false,
2434
+ "single_word": false,
2435
+ "special": true
2436
+ },
2437
+ "306": {
2438
+ "content": "<|reserved_296|>",
2439
+ "lstrip": false,
2440
+ "normalized": false,
2441
+ "rstrip": false,
2442
+ "single_word": false,
2443
+ "special": true
2444
+ },
2445
+ "307": {
2446
+ "content": "<|reserved_297|>",
2447
+ "lstrip": false,
2448
+ "normalized": false,
2449
+ "rstrip": false,
2450
+ "single_word": false,
2451
+ "special": true
2452
+ },
2453
+ "308": {
2454
+ "content": "<|reserved_298|>",
2455
+ "lstrip": false,
2456
+ "normalized": false,
2457
+ "rstrip": false,
2458
+ "single_word": false,
2459
+ "special": true
2460
+ },
2461
+ "309": {
2462
+ "content": "<|reserved_299|>",
2463
+ "lstrip": false,
2464
+ "normalized": false,
2465
+ "rstrip": false,
2466
+ "single_word": false,
2467
+ "special": true
2468
+ },
2469
+ "310": {
2470
+ "content": "<|reserved_300|>",
2471
+ "lstrip": false,
2472
+ "normalized": false,
2473
+ "rstrip": false,
2474
+ "single_word": false,
2475
+ "special": true
2476
+ },
2477
+ "311": {
2478
+ "content": "<|reserved_301|>",
2479
+ "lstrip": false,
2480
+ "normalized": false,
2481
+ "rstrip": false,
2482
+ "single_word": false,
2483
+ "special": true
2484
+ },
2485
+ "312": {
2486
+ "content": "<|reserved_302|>",
2487
+ "lstrip": false,
2488
+ "normalized": false,
2489
+ "rstrip": false,
2490
+ "single_word": false,
2491
+ "special": true
2492
+ },
2493
+ "313": {
2494
+ "content": "<|reserved_303|>",
2495
+ "lstrip": false,
2496
+ "normalized": false,
2497
+ "rstrip": false,
2498
+ "single_word": false,
2499
+ "special": true
2500
+ },
2501
+ "314": {
2502
+ "content": "<|reserved_304|>",
2503
+ "lstrip": false,
2504
+ "normalized": false,
2505
+ "rstrip": false,
2506
+ "single_word": false,
2507
+ "special": true
2508
+ },
2509
+ "315": {
2510
+ "content": "<|reserved_305|>",
2511
+ "lstrip": false,
2512
+ "normalized": false,
2513
+ "rstrip": false,
2514
+ "single_word": false,
2515
+ "special": true
2516
+ },
2517
+ "316": {
2518
+ "content": "<|reserved_306|>",
2519
+ "lstrip": false,
2520
+ "normalized": false,
2521
+ "rstrip": false,
2522
+ "single_word": false,
2523
+ "special": true
2524
+ },
2525
+ "317": {
2526
+ "content": "<|reserved_307|>",
2527
+ "lstrip": false,
2528
+ "normalized": false,
2529
+ "rstrip": false,
2530
+ "single_word": false,
2531
+ "special": true
2532
+ },
2533
+ "318": {
2534
+ "content": "<|reserved_308|>",
2535
+ "lstrip": false,
2536
+ "normalized": false,
2537
+ "rstrip": false,
2538
+ "single_word": false,
2539
+ "special": true
2540
+ },
2541
+ "319": {
2542
+ "content": "<|reserved_309|>",
2543
+ "lstrip": false,
2544
+ "normalized": false,
2545
+ "rstrip": false,
2546
+ "single_word": false,
2547
+ "special": true
2548
+ },
2549
+ "320": {
2550
+ "content": "<|reserved_310|>",
2551
+ "lstrip": false,
2552
+ "normalized": false,
2553
+ "rstrip": false,
2554
+ "single_word": false,
2555
+ "special": true
2556
+ },
2557
+ "321": {
2558
+ "content": "<|reserved_311|>",
2559
+ "lstrip": false,
2560
+ "normalized": false,
2561
+ "rstrip": false,
2562
+ "single_word": false,
2563
+ "special": true
2564
+ },
2565
+ "322": {
2566
+ "content": "<|reserved_312|>",
2567
+ "lstrip": false,
2568
+ "normalized": false,
2569
+ "rstrip": false,
2570
+ "single_word": false,
2571
+ "special": true
2572
+ },
2573
+ "323": {
2574
+ "content": "<|reserved_313|>",
2575
+ "lstrip": false,
2576
+ "normalized": false,
2577
+ "rstrip": false,
2578
+ "single_word": false,
2579
+ "special": true
2580
+ },
2581
+ "324": {
2582
+ "content": "<|reserved_314|>",
2583
+ "lstrip": false,
2584
+ "normalized": false,
2585
+ "rstrip": false,
2586
+ "single_word": false,
2587
+ "special": true
2588
+ },
2589
+ "325": {
2590
+ "content": "<|reserved_315|>",
2591
+ "lstrip": false,
2592
+ "normalized": false,
2593
+ "rstrip": false,
2594
+ "single_word": false,
2595
+ "special": true
2596
+ },
2597
+ "326": {
2598
+ "content": "<|reserved_316|>",
2599
+ "lstrip": false,
2600
+ "normalized": false,
2601
+ "rstrip": false,
2602
+ "single_word": false,
2603
+ "special": true
2604
+ },
2605
+ "327": {
2606
+ "content": "<|reserved_317|>",
2607
+ "lstrip": false,
2608
+ "normalized": false,
2609
+ "rstrip": false,
2610
+ "single_word": false,
2611
+ "special": true
2612
+ },
2613
+ "328": {
2614
+ "content": "<|reserved_318|>",
2615
+ "lstrip": false,
2616
+ "normalized": false,
2617
+ "rstrip": false,
2618
+ "single_word": false,
2619
+ "special": true
2620
+ },
2621
+ "329": {
2622
+ "content": "<|reserved_319|>",
2623
+ "lstrip": false,
2624
+ "normalized": false,
2625
+ "rstrip": false,
2626
+ "single_word": false,
2627
+ "special": true
2628
+ },
2629
+ "330": {
2630
+ "content": "<|reserved_320|>",
2631
+ "lstrip": false,
2632
+ "normalized": false,
2633
+ "rstrip": false,
2634
+ "single_word": false,
2635
+ "special": true
2636
+ },
2637
+ "331": {
2638
+ "content": "<|reserved_321|>",
2639
+ "lstrip": false,
2640
+ "normalized": false,
2641
+ "rstrip": false,
2642
+ "single_word": false,
2643
+ "special": true
2644
+ },
2645
+ "332": {
2646
+ "content": "<|reserved_322|>",
2647
+ "lstrip": false,
2648
+ "normalized": false,
2649
+ "rstrip": false,
2650
+ "single_word": false,
2651
+ "special": true
2652
+ },
2653
+ "333": {
2654
+ "content": "<|reserved_323|>",
2655
+ "lstrip": false,
2656
+ "normalized": false,
2657
+ "rstrip": false,
2658
+ "single_word": false,
2659
+ "special": true
2660
+ },
2661
+ "334": {
2662
+ "content": "<|reserved_324|>",
2663
+ "lstrip": false,
2664
+ "normalized": false,
2665
+ "rstrip": false,
2666
+ "single_word": false,
2667
+ "special": true
2668
+ },
2669
+ "335": {
2670
+ "content": "<|reserved_325|>",
2671
+ "lstrip": false,
2672
+ "normalized": false,
2673
+ "rstrip": false,
2674
+ "single_word": false,
2675
+ "special": true
2676
+ },
2677
+ "336": {
2678
+ "content": "<|reserved_326|>",
2679
+ "lstrip": false,
2680
+ "normalized": false,
2681
+ "rstrip": false,
2682
+ "single_word": false,
2683
+ "special": true
2684
+ },
2685
+ "337": {
2686
+ "content": "<|reserved_327|>",
2687
+ "lstrip": false,
2688
+ "normalized": false,
2689
+ "rstrip": false,
2690
+ "single_word": false,
2691
+ "special": true
2692
+ },
2693
+ "338": {
2694
+ "content": "<|reserved_328|>",
2695
+ "lstrip": false,
2696
+ "normalized": false,
2697
+ "rstrip": false,
2698
+ "single_word": false,
2699
+ "special": true
2700
+ },
2701
+ "339": {
2702
+ "content": "<|reserved_329|>",
2703
+ "lstrip": false,
2704
+ "normalized": false,
2705
+ "rstrip": false,
2706
+ "single_word": false,
2707
+ "special": true
2708
+ },
2709
+ "340": {
2710
+ "content": "<|reserved_330|>",
2711
+ "lstrip": false,
2712
+ "normalized": false,
2713
+ "rstrip": false,
2714
+ "single_word": false,
2715
+ "special": true
2716
+ },
2717
+ "341": {
2718
+ "content": "<|reserved_331|>",
2719
+ "lstrip": false,
2720
+ "normalized": false,
2721
+ "rstrip": false,
2722
+ "single_word": false,
2723
+ "special": true
2724
+ },
2725
+ "342": {
2726
+ "content": "<|reserved_332|>",
2727
+ "lstrip": false,
2728
+ "normalized": false,
2729
+ "rstrip": false,
2730
+ "single_word": false,
2731
+ "special": true
2732
+ },
2733
+ "343": {
2734
+ "content": "<|reserved_333|>",
2735
+ "lstrip": false,
2736
+ "normalized": false,
2737
+ "rstrip": false,
2738
+ "single_word": false,
2739
+ "special": true
2740
+ },
2741
+ "344": {
2742
+ "content": "<|reserved_334|>",
2743
+ "lstrip": false,
2744
+ "normalized": false,
2745
+ "rstrip": false,
2746
+ "single_word": false,
2747
+ "special": true
2748
+ },
2749
+ "345": {
2750
+ "content": "<|reserved_335|>",
2751
+ "lstrip": false,
2752
+ "normalized": false,
2753
+ "rstrip": false,
2754
+ "single_word": false,
2755
+ "special": true
2756
+ },
2757
+ "346": {
2758
+ "content": "<|reserved_336|>",
2759
+ "lstrip": false,
2760
+ "normalized": false,
2761
+ "rstrip": false,
2762
+ "single_word": false,
2763
+ "special": true
2764
+ },
2765
+ "347": {
2766
+ "content": "<|reserved_337|>",
2767
+ "lstrip": false,
2768
+ "normalized": false,
2769
+ "rstrip": false,
2770
+ "single_word": false,
2771
+ "special": true
2772
+ },
2773
+ "348": {
2774
+ "content": "<|reserved_338|>",
2775
+ "lstrip": false,
2776
+ "normalized": false,
2777
+ "rstrip": false,
2778
+ "single_word": false,
2779
+ "special": true
2780
+ },
2781
+ "349": {
2782
+ "content": "<|reserved_339|>",
2783
+ "lstrip": false,
2784
+ "normalized": false,
2785
+ "rstrip": false,
2786
+ "single_word": false,
2787
+ "special": true
2788
+ },
2789
+ "350": {
2790
+ "content": "<|reserved_340|>",
2791
+ "lstrip": false,
2792
+ "normalized": false,
2793
+ "rstrip": false,
2794
+ "single_word": false,
2795
+ "special": true
2796
+ },
2797
+ "351": {
2798
+ "content": "<|reserved_341|>",
2799
+ "lstrip": false,
2800
+ "normalized": false,
2801
+ "rstrip": false,
2802
+ "single_word": false,
2803
+ "special": true
2804
+ },
2805
+ "352": {
2806
+ "content": "<|reserved_342|>",
2807
+ "lstrip": false,
2808
+ "normalized": false,
2809
+ "rstrip": false,
2810
+ "single_word": false,
2811
+ "special": true
2812
+ },
2813
+ "353": {
2814
+ "content": "<|reserved_343|>",
2815
+ "lstrip": false,
2816
+ "normalized": false,
2817
+ "rstrip": false,
2818
+ "single_word": false,
2819
+ "special": true
2820
+ },
2821
+ "354": {
2822
+ "content": "<|reserved_344|>",
2823
+ "lstrip": false,
2824
+ "normalized": false,
2825
+ "rstrip": false,
2826
+ "single_word": false,
2827
+ "special": true
2828
+ },
2829
+ "355": {
2830
+ "content": "<|reserved_345|>",
2831
+ "lstrip": false,
2832
+ "normalized": false,
2833
+ "rstrip": false,
2834
+ "single_word": false,
2835
+ "special": true
2836
+ },
2837
+ "356": {
2838
+ "content": "<|reserved_346|>",
2839
+ "lstrip": false,
2840
+ "normalized": false,
2841
+ "rstrip": false,
2842
+ "single_word": false,
2843
+ "special": true
2844
+ },
2845
+ "357": {
2846
+ "content": "<|reserved_347|>",
2847
+ "lstrip": false,
2848
+ "normalized": false,
2849
+ "rstrip": false,
2850
+ "single_word": false,
2851
+ "special": true
2852
+ },
2853
+ "358": {
2854
+ "content": "<|reserved_348|>",
2855
+ "lstrip": false,
2856
+ "normalized": false,
2857
+ "rstrip": false,
2858
+ "single_word": false,
2859
+ "special": true
2860
+ },
2861
+ "359": {
2862
+ "content": "<|reserved_349|>",
2863
+ "lstrip": false,
2864
+ "normalized": false,
2865
+ "rstrip": false,
2866
+ "single_word": false,
2867
+ "special": true
2868
+ },
2869
+ "360": {
2870
+ "content": "<|reserved_350|>",
2871
+ "lstrip": false,
2872
+ "normalized": false,
2873
+ "rstrip": false,
2874
+ "single_word": false,
2875
+ "special": true
2876
+ },
2877
+ "361": {
2878
+ "content": "<|reserved_351|>",
2879
+ "lstrip": false,
2880
+ "normalized": false,
2881
+ "rstrip": false,
2882
+ "single_word": false,
2883
+ "special": true
2884
+ },
2885
+ "362": {
2886
+ "content": "<|reserved_352|>",
2887
+ "lstrip": false,
2888
+ "normalized": false,
2889
+ "rstrip": false,
2890
+ "single_word": false,
2891
+ "special": true
2892
+ },
2893
+ "363": {
2894
+ "content": "<|reserved_353|>",
2895
+ "lstrip": false,
2896
+ "normalized": false,
2897
+ "rstrip": false,
2898
+ "single_word": false,
2899
+ "special": true
2900
+ },
2901
+ "364": {
2902
+ "content": "<|reserved_354|>",
2903
+ "lstrip": false,
2904
+ "normalized": false,
2905
+ "rstrip": false,
2906
+ "single_word": false,
2907
+ "special": true
2908
+ },
2909
+ "365": {
2910
+ "content": "<|reserved_355|>",
2911
+ "lstrip": false,
2912
+ "normalized": false,
2913
+ "rstrip": false,
2914
+ "single_word": false,
2915
+ "special": true
2916
+ },
2917
+ "366": {
2918
+ "content": "<|reserved_356|>",
2919
+ "lstrip": false,
2920
+ "normalized": false,
2921
+ "rstrip": false,
2922
+ "single_word": false,
2923
+ "special": true
2924
+ },
2925
+ "367": {
2926
+ "content": "<|reserved_357|>",
2927
+ "lstrip": false,
2928
+ "normalized": false,
2929
+ "rstrip": false,
2930
+ "single_word": false,
2931
+ "special": true
2932
+ },
2933
+ "368": {
2934
+ "content": "<|reserved_358|>",
2935
+ "lstrip": false,
2936
+ "normalized": false,
2937
+ "rstrip": false,
2938
+ "single_word": false,
2939
+ "special": true
2940
+ },
2941
+ "369": {
2942
+ "content": "<|reserved_359|>",
2943
+ "lstrip": false,
2944
+ "normalized": false,
2945
+ "rstrip": false,
2946
+ "single_word": false,
2947
+ "special": true
2948
+ },
2949
+ "370": {
2950
+ "content": "<|reserved_360|>",
2951
+ "lstrip": false,
2952
+ "normalized": false,
2953
+ "rstrip": false,
2954
+ "single_word": false,
2955
+ "special": true
2956
+ },
2957
+ "371": {
2958
+ "content": "<|reserved_361|>",
2959
+ "lstrip": false,
2960
+ "normalized": false,
2961
+ "rstrip": false,
2962
+ "single_word": false,
2963
+ "special": true
2964
+ },
2965
+ "372": {
2966
+ "content": "<|reserved_362|>",
2967
+ "lstrip": false,
2968
+ "normalized": false,
2969
+ "rstrip": false,
2970
+ "single_word": false,
2971
+ "special": true
2972
+ },
2973
+ "373": {
2974
+ "content": "<|reserved_363|>",
2975
+ "lstrip": false,
2976
+ "normalized": false,
2977
+ "rstrip": false,
2978
+ "single_word": false,
2979
+ "special": true
2980
+ },
2981
+ "374": {
2982
+ "content": "<|reserved_364|>",
2983
+ "lstrip": false,
2984
+ "normalized": false,
2985
+ "rstrip": false,
2986
+ "single_word": false,
2987
+ "special": true
2988
+ },
2989
+ "375": {
2990
+ "content": "<|reserved_365|>",
2991
+ "lstrip": false,
2992
+ "normalized": false,
2993
+ "rstrip": false,
2994
+ "single_word": false,
2995
+ "special": true
2996
+ },
2997
+ "376": {
2998
+ "content": "<|reserved_366|>",
2999
+ "lstrip": false,
3000
+ "normalized": false,
3001
+ "rstrip": false,
3002
+ "single_word": false,
3003
+ "special": true
3004
+ },
3005
+ "377": {
3006
+ "content": "<|reserved_367|>",
3007
+ "lstrip": false,
3008
+ "normalized": false,
3009
+ "rstrip": false,
3010
+ "single_word": false,
3011
+ "special": true
3012
+ },
3013
+ "378": {
3014
+ "content": "<|reserved_368|>",
3015
+ "lstrip": false,
3016
+ "normalized": false,
3017
+ "rstrip": false,
3018
+ "single_word": false,
3019
+ "special": true
3020
+ },
3021
+ "379": {
3022
+ "content": "<|reserved_369|>",
3023
+ "lstrip": false,
3024
+ "normalized": false,
3025
+ "rstrip": false,
3026
+ "single_word": false,
3027
+ "special": true
3028
+ },
3029
+ "380": {
3030
+ "content": "<|reserved_370|>",
3031
+ "lstrip": false,
3032
+ "normalized": false,
3033
+ "rstrip": false,
3034
+ "single_word": false,
3035
+ "special": true
3036
+ },
3037
+ "381": {
3038
+ "content": "<|reserved_371|>",
3039
+ "lstrip": false,
3040
+ "normalized": false,
3041
+ "rstrip": false,
3042
+ "single_word": false,
3043
+ "special": true
3044
+ },
3045
+ "382": {
3046
+ "content": "<|reserved_372|>",
3047
+ "lstrip": false,
3048
+ "normalized": false,
3049
+ "rstrip": false,
3050
+ "single_word": false,
3051
+ "special": true
3052
+ },
3053
+ "383": {
3054
+ "content": "<|reserved_373|>",
3055
+ "lstrip": false,
3056
+ "normalized": false,
3057
+ "rstrip": false,
3058
+ "single_word": false,
3059
+ "special": true
3060
+ },
3061
+ "384": {
3062
+ "content": "<|reserved_374|>",
3063
+ "lstrip": false,
3064
+ "normalized": false,
3065
+ "rstrip": false,
3066
+ "single_word": false,
3067
+ "special": true
3068
+ },
3069
+ "385": {
3070
+ "content": "<|reserved_375|>",
3071
+ "lstrip": false,
3072
+ "normalized": false,
3073
+ "rstrip": false,
3074
+ "single_word": false,
3075
+ "special": true
3076
+ },
3077
+ "386": {
3078
+ "content": "<|reserved_376|>",
3079
+ "lstrip": false,
3080
+ "normalized": false,
3081
+ "rstrip": false,
3082
+ "single_word": false,
3083
+ "special": true
3084
+ },
3085
+ "387": {
3086
+ "content": "<|reserved_377|>",
3087
+ "lstrip": false,
3088
+ "normalized": false,
3089
+ "rstrip": false,
3090
+ "single_word": false,
3091
+ "special": true
3092
+ },
3093
+ "388": {
3094
+ "content": "<|reserved_378|>",
3095
+ "lstrip": false,
3096
+ "normalized": false,
3097
+ "rstrip": false,
3098
+ "single_word": false,
3099
+ "special": true
3100
+ },
3101
+ "389": {
3102
+ "content": "<|reserved_379|>",
3103
+ "lstrip": false,
3104
+ "normalized": false,
3105
+ "rstrip": false,
3106
+ "single_word": false,
3107
+ "special": true
3108
+ },
3109
+ "390": {
3110
+ "content": "<|reserved_380|>",
3111
+ "lstrip": false,
3112
+ "normalized": false,
3113
+ "rstrip": false,
3114
+ "single_word": false,
3115
+ "special": true
3116
+ },
3117
+ "391": {
3118
+ "content": "<|reserved_381|>",
3119
+ "lstrip": false,
3120
+ "normalized": false,
3121
+ "rstrip": false,
3122
+ "single_word": false,
3123
+ "special": true
3124
+ },
3125
+ "392": {
3126
+ "content": "<|reserved_382|>",
3127
+ "lstrip": false,
3128
+ "normalized": false,
3129
+ "rstrip": false,
3130
+ "single_word": false,
3131
+ "special": true
3132
+ },
3133
+ "393": {
3134
+ "content": "<|reserved_383|>",
3135
+ "lstrip": false,
3136
+ "normalized": false,
3137
+ "rstrip": false,
3138
+ "single_word": false,
3139
+ "special": true
3140
+ },
3141
+ "394": {
3142
+ "content": "<|reserved_384|>",
3143
+ "lstrip": false,
3144
+ "normalized": false,
3145
+ "rstrip": false,
3146
+ "single_word": false,
3147
+ "special": true
3148
+ },
3149
+ "395": {
3150
+ "content": "<|reserved_385|>",
3151
+ "lstrip": false,
3152
+ "normalized": false,
3153
+ "rstrip": false,
3154
+ "single_word": false,
3155
+ "special": true
3156
+ },
3157
+ "396": {
3158
+ "content": "<image>",
3159
+ "lstrip": false,
3160
+ "normalized": false,
3161
+ "rstrip": false,
3162
+ "single_word": false,
3163
+ "special": true
3164
+ },
3165
+ "397": {
3166
+ "content": "<|img_row_1_col_1|>",
3167
+ "lstrip": false,
3168
+ "normalized": false,
3169
+ "rstrip": false,
3170
+ "single_word": false,
3171
+ "special": true
3172
+ },
3173
+ "398": {
3174
+ "content": "<|img_row_1_col_2|>",
3175
+ "lstrip": false,
3176
+ "normalized": false,
3177
+ "rstrip": false,
3178
+ "single_word": false,
3179
+ "special": true
3180
+ },
3181
+ "399": {
3182
+ "content": "<|img_row_1_col_3|>",
3183
+ "lstrip": false,
3184
+ "normalized": false,
3185
+ "rstrip": false,
3186
+ "single_word": false,
3187
+ "special": true
3188
+ },
3189
+ "400": {
3190
+ "content": "<|img_row_1_col_4|>",
3191
+ "lstrip": false,
3192
+ "normalized": false,
3193
+ "rstrip": false,
3194
+ "single_word": false,
3195
+ "special": true
3196
+ },
3197
+ "401": {
3198
+ "content": "<|img_row_1_col_5|>",
3199
+ "lstrip": false,
3200
+ "normalized": false,
3201
+ "rstrip": false,
3202
+ "single_word": false,
3203
+ "special": true
3204
+ },
3205
+ "402": {
3206
+ "content": "<|img_row_1_col_6|>",
3207
+ "lstrip": false,
3208
+ "normalized": false,
3209
+ "rstrip": false,
3210
+ "single_word": false,
3211
+ "special": true
3212
+ },
3213
+ "403": {
3214
+ "content": "<|img_row_1_col_7|>",
3215
+ "lstrip": false,
3216
+ "normalized": false,
3217
+ "rstrip": false,
3218
+ "single_word": false,
3219
+ "special": true
3220
+ },
3221
+ "404": {
3222
+ "content": "<|img_row_1_col_8|>",
3223
+ "lstrip": false,
3224
+ "normalized": false,
3225
+ "rstrip": false,
3226
+ "single_word": false,
3227
+ "special": true
3228
+ },
3229
+ "405": {
3230
+ "content": "<|img_row_1_col_9|>",
3231
+ "lstrip": false,
3232
+ "normalized": false,
3233
+ "rstrip": false,
3234
+ "single_word": false,
3235
+ "special": true
3236
+ },
3237
+ "406": {
3238
+ "content": "<|img_row_1_col_10|>",
3239
+ "lstrip": false,
3240
+ "normalized": false,
3241
+ "rstrip": false,
3242
+ "single_word": false,
3243
+ "special": true
3244
+ },
3245
+ "407": {
3246
+ "content": "<|img_row_2_col_1|>",
3247
+ "lstrip": false,
3248
+ "normalized": false,
3249
+ "rstrip": false,
3250
+ "single_word": false,
3251
+ "special": true
3252
+ },
3253
+ "408": {
3254
+ "content": "<|img_row_2_col_2|>",
3255
+ "lstrip": false,
3256
+ "normalized": false,
3257
+ "rstrip": false,
3258
+ "single_word": false,
3259
+ "special": true
3260
+ },
3261
+ "409": {
3262
+ "content": "<|img_row_2_col_3|>",
3263
+ "lstrip": false,
3264
+ "normalized": false,
3265
+ "rstrip": false,
3266
+ "single_word": false,
3267
+ "special": true
3268
+ },
3269
+ "410": {
3270
+ "content": "<|img_row_2_col_4|>",
3271
+ "lstrip": false,
3272
+ "normalized": false,
3273
+ "rstrip": false,
3274
+ "single_word": false,
3275
+ "special": true
3276
+ },
3277
+ "411": {
3278
+ "content": "<|img_row_2_col_5|>",
3279
+ "lstrip": false,
3280
+ "normalized": false,
3281
+ "rstrip": false,
3282
+ "single_word": false,
3283
+ "special": true
3284
+ },
3285
+ "412": {
3286
+ "content": "<|img_row_2_col_6|>",
3287
+ "lstrip": false,
3288
+ "normalized": false,
3289
+ "rstrip": false,
3290
+ "single_word": false,
3291
+ "special": true
3292
+ },
3293
+ "413": {
3294
+ "content": "<|img_row_2_col_7|>",
3295
+ "lstrip": false,
3296
+ "normalized": false,
3297
+ "rstrip": false,
3298
+ "single_word": false,
3299
+ "special": true
3300
+ },
3301
+ "414": {
3302
+ "content": "<|img_row_2_col_8|>",
3303
+ "lstrip": false,
3304
+ "normalized": false,
3305
+ "rstrip": false,
3306
+ "single_word": false,
3307
+ "special": true
3308
+ },
3309
+ "415": {
3310
+ "content": "<|img_row_2_col_9|>",
3311
+ "lstrip": false,
3312
+ "normalized": false,
3313
+ "rstrip": false,
3314
+ "single_word": false,
3315
+ "special": true
3316
+ },
3317
+ "416": {
3318
+ "content": "<|img_row_2_col_10|>",
3319
+ "lstrip": false,
3320
+ "normalized": false,
3321
+ "rstrip": false,
3322
+ "single_word": false,
3323
+ "special": true
3324
+ },
3325
+ "417": {
3326
+ "content": "<|img_row_3_col_1|>",
3327
+ "lstrip": false,
3328
+ "normalized": false,
3329
+ "rstrip": false,
3330
+ "single_word": false,
3331
+ "special": true
3332
+ },
3333
+ "418": {
3334
+ "content": "<|img_row_3_col_2|>",
3335
+ "lstrip": false,
3336
+ "normalized": false,
3337
+ "rstrip": false,
3338
+ "single_word": false,
3339
+ "special": true
3340
+ },
3341
+ "419": {
3342
+ "content": "<|img_row_3_col_3|>",
3343
+ "lstrip": false,
3344
+ "normalized": false,
3345
+ "rstrip": false,
3346
+ "single_word": false,
3347
+ "special": true
3348
+ },
3349
+ "420": {
3350
+ "content": "<|img_row_3_col_4|>",
3351
+ "lstrip": false,
3352
+ "normalized": false,
3353
+ "rstrip": false,
3354
+ "single_word": false,
3355
+ "special": true
3356
+ },
3357
+ "421": {
3358
+ "content": "<|img_row_3_col_5|>",
3359
+ "lstrip": false,
3360
+ "normalized": false,
3361
+ "rstrip": false,
3362
+ "single_word": false,
3363
+ "special": true
3364
+ },
3365
+ "422": {
3366
+ "content": "<|img_row_3_col_6|>",
3367
+ "lstrip": false,
3368
+ "normalized": false,
3369
+ "rstrip": false,
3370
+ "single_word": false,
3371
+ "special": true
3372
+ },
3373
+ "423": {
3374
+ "content": "<|img_row_3_col_7|>",
3375
+ "lstrip": false,
3376
+ "normalized": false,
3377
+ "rstrip": false,
3378
+ "single_word": false,
3379
+ "special": true
3380
+ },
3381
+ "424": {
3382
+ "content": "<|img_row_3_col_8|>",
3383
+ "lstrip": false,
3384
+ "normalized": false,
3385
+ "rstrip": false,
3386
+ "single_word": false,
3387
+ "special": true
3388
+ },
3389
+ "425": {
3390
+ "content": "<|img_row_3_col_9|>",
3391
+ "lstrip": false,
3392
+ "normalized": false,
3393
+ "rstrip": false,
3394
+ "single_word": false,
3395
+ "special": true
3396
+ },
3397
+ "426": {
3398
+ "content": "<|img_row_3_col_10|>",
3399
+ "lstrip": false,
3400
+ "normalized": false,
3401
+ "rstrip": false,
3402
+ "single_word": false,
3403
+ "special": true
3404
+ },
3405
+ "427": {
3406
+ "content": "<|img_row_4_col_1|>",
3407
+ "lstrip": false,
3408
+ "normalized": false,
3409
+ "rstrip": false,
3410
+ "single_word": false,
3411
+ "special": true
3412
+ },
3413
+ "428": {
3414
+ "content": "<|img_row_4_col_2|>",
3415
+ "lstrip": false,
3416
+ "normalized": false,
3417
+ "rstrip": false,
3418
+ "single_word": false,
3419
+ "special": true
3420
+ },
3421
+ "429": {
3422
+ "content": "<|img_row_4_col_3|>",
3423
+ "lstrip": false,
3424
+ "normalized": false,
3425
+ "rstrip": false,
3426
+ "single_word": false,
3427
+ "special": true
3428
+ },
3429
+ "430": {
3430
+ "content": "<|img_row_4_col_4|>",
3431
+ "lstrip": false,
3432
+ "normalized": false,
3433
+ "rstrip": false,
3434
+ "single_word": false,
3435
+ "special": true
3436
+ },
3437
+ "431": {
3438
+ "content": "<|img_row_4_col_5|>",
3439
+ "lstrip": false,
3440
+ "normalized": false,
3441
+ "rstrip": false,
3442
+ "single_word": false,
3443
+ "special": true
3444
+ },
3445
+ "432": {
3446
+ "content": "<|img_row_4_col_6|>",
3447
+ "lstrip": false,
3448
+ "normalized": false,
3449
+ "rstrip": false,
3450
+ "single_word": false,
3451
+ "special": true
3452
+ },
3453
+ "433": {
3454
+ "content": "<|img_row_4_col_7|>",
3455
+ "lstrip": false,
3456
+ "normalized": false,
3457
+ "rstrip": false,
3458
+ "single_word": false,
3459
+ "special": true
3460
+ },
3461
+ "434": {
3462
+ "content": "<|img_row_4_col_8|>",
3463
+ "lstrip": false,
3464
+ "normalized": false,
3465
+ "rstrip": false,
3466
+ "single_word": false,
3467
+ "special": true
3468
+ },
3469
+ "435": {
3470
+ "content": "<|img_row_4_col_9|>",
3471
+ "lstrip": false,
3472
+ "normalized": false,
3473
+ "rstrip": false,
3474
+ "single_word": false,
3475
+ "special": true
3476
+ },
3477
+ "436": {
3478
+ "content": "<|img_row_4_col_10|>",
3479
+ "lstrip": false,
3480
+ "normalized": false,
3481
+ "rstrip": false,
3482
+ "single_word": false,
3483
+ "special": true
3484
+ },
3485
+ "437": {
3486
+ "content": "<|img_row_5_col_1|>",
3487
+ "lstrip": false,
3488
+ "normalized": false,
3489
+ "rstrip": false,
3490
+ "single_word": false,
3491
+ "special": true
3492
+ },
3493
+ "438": {
3494
+ "content": "<|img_row_5_col_2|>",
3495
+ "lstrip": false,
3496
+ "normalized": false,
3497
+ "rstrip": false,
3498
+ "single_word": false,
3499
+ "special": true
3500
+ },
3501
+ "439": {
3502
+ "content": "<|img_row_5_col_3|>",
3503
+ "lstrip": false,
3504
+ "normalized": false,
3505
+ "rstrip": false,
3506
+ "single_word": false,
3507
+ "special": true
3508
+ },
3509
+ "440": {
3510
+ "content": "<|img_row_5_col_4|>",
3511
+ "lstrip": false,
3512
+ "normalized": false,
3513
+ "rstrip": false,
3514
+ "single_word": false,
3515
+ "special": true
3516
+ },
3517
+ "441": {
3518
+ "content": "<|img_row_5_col_5|>",
3519
+ "lstrip": false,
3520
+ "normalized": false,
3521
+ "rstrip": false,
3522
+ "single_word": false,
3523
+ "special": true
3524
+ },
3525
+ "442": {
3526
+ "content": "<|img_row_5_col_6|>",
3527
+ "lstrip": false,
3528
+ "normalized": false,
3529
+ "rstrip": false,
3530
+ "single_word": false,
3531
+ "special": true
3532
+ },
3533
+ "443": {
3534
+ "content": "<|img_row_5_col_7|>",
3535
+ "lstrip": false,
3536
+ "normalized": false,
3537
+ "rstrip": false,
3538
+ "single_word": false,
3539
+ "special": true
3540
+ },
3541
+ "444": {
3542
+ "content": "<|img_row_5_col_8|>",
3543
+ "lstrip": false,
3544
+ "normalized": false,
3545
+ "rstrip": false,
3546
+ "single_word": false,
3547
+ "special": true
3548
+ },
3549
+ "445": {
3550
+ "content": "<|img_row_5_col_9|>",
3551
+ "lstrip": false,
3552
+ "normalized": false,
3553
+ "rstrip": false,
3554
+ "single_word": false,
3555
+ "special": true
3556
+ },
3557
+ "446": {
3558
+ "content": "<|img_row_5_col_10|>",
3559
+ "lstrip": false,
3560
+ "normalized": false,
3561
+ "rstrip": false,
3562
+ "single_word": false,
3563
+ "special": true
3564
+ },
3565
+ "447": {
3566
+ "content": "<|img_row_6_col_1|>",
3567
+ "lstrip": false,
3568
+ "normalized": false,
3569
+ "rstrip": false,
3570
+ "single_word": false,
3571
+ "special": true
3572
+ },
3573
+ "448": {
3574
+ "content": "<|img_row_6_col_2|>",
3575
+ "lstrip": false,
3576
+ "normalized": false,
3577
+ "rstrip": false,
3578
+ "single_word": false,
3579
+ "special": true
3580
+ },
3581
+ "449": {
3582
+ "content": "<|img_row_6_col_3|>",
3583
+ "lstrip": false,
3584
+ "normalized": false,
3585
+ "rstrip": false,
3586
+ "single_word": false,
3587
+ "special": true
3588
+ },
3589
+ "450": {
3590
+ "content": "<|img_row_6_col_4|>",
3591
+ "lstrip": false,
3592
+ "normalized": false,
3593
+ "rstrip": false,
3594
+ "single_word": false,
3595
+ "special": true
3596
+ },
3597
+ "451": {
3598
+ "content": "<|img_row_6_col_5|>",
3599
+ "lstrip": false,
3600
+ "normalized": false,
3601
+ "rstrip": false,
3602
+ "single_word": false,
3603
+ "special": true
3604
+ },
3605
+ "452": {
3606
+ "content": "<|img_row_6_col_6|>",
3607
+ "lstrip": false,
3608
+ "normalized": false,
3609
+ "rstrip": false,
3610
+ "single_word": false,
3611
+ "special": true
3612
+ },
3613
+ "453": {
3614
+ "content": "<|img_row_6_col_7|>",
3615
+ "lstrip": false,
3616
+ "normalized": false,
3617
+ "rstrip": false,
3618
+ "single_word": false,
3619
+ "special": true
3620
+ },
3621
+ "454": {
3622
+ "content": "<|img_row_6_col_8|>",
3623
+ "lstrip": false,
3624
+ "normalized": false,
3625
+ "rstrip": false,
3626
+ "single_word": false,
3627
+ "special": true
3628
+ },
3629
+ "455": {
3630
+ "content": "<|img_row_6_col_9|>",
3631
+ "lstrip": false,
3632
+ "normalized": false,
3633
+ "rstrip": false,
3634
+ "single_word": false,
3635
+ "special": true
3636
+ },
3637
+ "456": {
3638
+ "content": "<|img_row_6_col_10|>",
3639
+ "lstrip": false,
3640
+ "normalized": false,
3641
+ "rstrip": false,
3642
+ "single_word": false,
3643
+ "special": true
3644
+ },
3645
+ "457": {
3646
+ "content": "<|img_row_7_col_1|>",
3647
+ "lstrip": false,
3648
+ "normalized": false,
3649
+ "rstrip": false,
3650
+ "single_word": false,
3651
+ "special": true
3652
+ },
3653
+ "458": {
3654
+ "content": "<|img_row_7_col_2|>",
3655
+ "lstrip": false,
3656
+ "normalized": false,
3657
+ "rstrip": false,
3658
+ "single_word": false,
3659
+ "special": true
3660
+ },
3661
+ "459": {
3662
+ "content": "<|img_row_7_col_3|>",
3663
+ "lstrip": false,
3664
+ "normalized": false,
3665
+ "rstrip": false,
3666
+ "single_word": false,
3667
+ "special": true
3668
+ },
3669
+ "460": {
3670
+ "content": "<|img_row_7_col_4|>",
3671
+ "lstrip": false,
3672
+ "normalized": false,
3673
+ "rstrip": false,
3674
+ "single_word": false,
3675
+ "special": true
3676
+ },
3677
+ "461": {
3678
+ "content": "<|img_row_7_col_5|>",
3679
+ "lstrip": false,
3680
+ "normalized": false,
3681
+ "rstrip": false,
3682
+ "single_word": false,
3683
+ "special": true
3684
+ },
3685
+ "462": {
3686
+ "content": "<|img_row_7_col_6|>",
3687
+ "lstrip": false,
3688
+ "normalized": false,
3689
+ "rstrip": false,
3690
+ "single_word": false,
3691
+ "special": true
3692
+ },
3693
+ "463": {
3694
+ "content": "<|img_row_7_col_7|>",
3695
+ "lstrip": false,
3696
+ "normalized": false,
3697
+ "rstrip": false,
3698
+ "single_word": false,
3699
+ "special": true
3700
+ },
3701
+ "464": {
3702
+ "content": "<|img_row_7_col_8|>",
3703
+ "lstrip": false,
3704
+ "normalized": false,
3705
+ "rstrip": false,
3706
+ "single_word": false,
3707
+ "special": true
3708
+ },
3709
+ "465": {
3710
+ "content": "<|img_row_7_col_9|>",
3711
+ "lstrip": false,
3712
+ "normalized": false,
3713
+ "rstrip": false,
3714
+ "single_word": false,
3715
+ "special": true
3716
+ },
3717
+ "466": {
3718
+ "content": "<|img_row_7_col_10|>",
3719
+ "lstrip": false,
3720
+ "normalized": false,
3721
+ "rstrip": false,
3722
+ "single_word": false,
3723
+ "special": true
3724
+ },
3725
+ "467": {
3726
+ "content": "<|img_row_8_col_1|>",
3727
+ "lstrip": false,
3728
+ "normalized": false,
3729
+ "rstrip": false,
3730
+ "single_word": false,
3731
+ "special": true
3732
+ },
3733
+ "468": {
3734
+ "content": "<|img_row_8_col_2|>",
3735
+ "lstrip": false,
3736
+ "normalized": false,
3737
+ "rstrip": false,
3738
+ "single_word": false,
3739
+ "special": true
3740
+ },
3741
+ "469": {
3742
+ "content": "<|img_row_8_col_3|>",
3743
+ "lstrip": false,
3744
+ "normalized": false,
3745
+ "rstrip": false,
3746
+ "single_word": false,
3747
+ "special": true
3748
+ },
3749
+ "470": {
3750
+ "content": "<|img_row_8_col_4|>",
3751
+ "lstrip": false,
3752
+ "normalized": false,
3753
+ "rstrip": false,
3754
+ "single_word": false,
3755
+ "special": true
3756
+ },
3757
+ "471": {
3758
+ "content": "<|img_row_8_col_5|>",
3759
+ "lstrip": false,
3760
+ "normalized": false,
3761
+ "rstrip": false,
3762
+ "single_word": false,
3763
+ "special": true
3764
+ },
3765
+ "472": {
3766
+ "content": "<|img_row_8_col_6|>",
3767
+ "lstrip": false,
3768
+ "normalized": false,
3769
+ "rstrip": false,
3770
+ "single_word": false,
3771
+ "special": true
3772
+ },
3773
+ "473": {
3774
+ "content": "<|img_row_8_col_7|>",
3775
+ "lstrip": false,
3776
+ "normalized": false,
3777
+ "rstrip": false,
3778
+ "single_word": false,
3779
+ "special": true
3780
+ },
3781
+ "474": {
3782
+ "content": "<|img_row_8_col_8|>",
3783
+ "lstrip": false,
3784
+ "normalized": false,
3785
+ "rstrip": false,
3786
+ "single_word": false,
3787
+ "special": true
3788
+ },
3789
+ "475": {
3790
+ "content": "<|img_row_8_col_9|>",
3791
+ "lstrip": false,
3792
+ "normalized": false,
3793
+ "rstrip": false,
3794
+ "single_word": false,
3795
+ "special": true
3796
+ },
3797
+ "476": {
3798
+ "content": "<|img_row_8_col_10|>",
3799
+ "lstrip": false,
3800
+ "normalized": false,
3801
+ "rstrip": false,
3802
+ "single_word": false,
3803
+ "special": true
3804
+ },
3805
+ "477": {
3806
+ "content": "<|img_row_9_col_1|>",
3807
+ "lstrip": false,
3808
+ "normalized": false,
3809
+ "rstrip": false,
3810
+ "single_word": false,
3811
+ "special": true
3812
+ },
3813
+ "478": {
3814
+ "content": "<|img_row_9_col_2|>",
3815
+ "lstrip": false,
3816
+ "normalized": false,
3817
+ "rstrip": false,
3818
+ "single_word": false,
3819
+ "special": true
3820
+ },
3821
+ "479": {
3822
+ "content": "<|img_row_9_col_3|>",
3823
+ "lstrip": false,
3824
+ "normalized": false,
3825
+ "rstrip": false,
3826
+ "single_word": false,
3827
+ "special": true
3828
+ },
3829
+ "480": {
3830
+ "content": "<|img_row_9_col_4|>",
3831
+ "lstrip": false,
3832
+ "normalized": false,
3833
+ "rstrip": false,
3834
+ "single_word": false,
3835
+ "special": true
3836
+ },
3837
+ "481": {
3838
+ "content": "<|img_row_9_col_5|>",
3839
+ "lstrip": false,
3840
+ "normalized": false,
3841
+ "rstrip": false,
3842
+ "single_word": false,
3843
+ "special": true
3844
+ },
3845
+ "482": {
3846
+ "content": "<|img_row_9_col_6|>",
3847
+ "lstrip": false,
3848
+ "normalized": false,
3849
+ "rstrip": false,
3850
+ "single_word": false,
3851
+ "special": true
3852
+ },
3853
+ "483": {
3854
+ "content": "<|img_row_9_col_7|>",
3855
+ "lstrip": false,
3856
+ "normalized": false,
3857
+ "rstrip": false,
3858
+ "single_word": false,
3859
+ "special": true
3860
+ },
3861
+ "484": {
3862
+ "content": "<|img_row_9_col_8|>",
3863
+ "lstrip": false,
3864
+ "normalized": false,
3865
+ "rstrip": false,
3866
+ "single_word": false,
3867
+ "special": true
3868
+ },
3869
+ "485": {
3870
+ "content": "<|img_row_9_col_9|>",
3871
+ "lstrip": false,
3872
+ "normalized": false,
3873
+ "rstrip": false,
3874
+ "single_word": false,
3875
+ "special": true
3876
+ },
3877
+ "486": {
3878
+ "content": "<|img_row_9_col_10|>",
3879
+ "lstrip": false,
3880
+ "normalized": false,
3881
+ "rstrip": false,
3882
+ "single_word": false,
3883
+ "special": true
3884
+ },
3885
+ "487": {
3886
+ "content": "<|img_row_10_col_1|>",
3887
+ "lstrip": false,
3888
+ "normalized": false,
3889
+ "rstrip": false,
3890
+ "single_word": false,
3891
+ "special": true
3892
+ },
3893
+ "488": {
3894
+ "content": "<|img_row_10_col_2|>",
3895
+ "lstrip": false,
3896
+ "normalized": false,
3897
+ "rstrip": false,
3898
+ "single_word": false,
3899
+ "special": true
3900
+ },
3901
+ "489": {
3902
+ "content": "<|img_row_10_col_3|>",
3903
+ "lstrip": false,
3904
+ "normalized": false,
3905
+ "rstrip": false,
3906
+ "single_word": false,
3907
+ "special": true
3908
+ },
3909
+ "490": {
3910
+ "content": "<|img_row_10_col_4|>",
3911
+ "lstrip": false,
3912
+ "normalized": false,
3913
+ "rstrip": false,
3914
+ "single_word": false,
3915
+ "special": true
3916
+ },
3917
+ "491": {
3918
+ "content": "<|img_row_10_col_5|>",
3919
+ "lstrip": false,
3920
+ "normalized": false,
3921
+ "rstrip": false,
3922
+ "single_word": false,
3923
+ "special": true
3924
+ },
3925
+ "492": {
3926
+ "content": "<|img_row_10_col_6|>",
3927
+ "lstrip": false,
3928
+ "normalized": false,
3929
+ "rstrip": false,
3930
+ "single_word": false,
3931
+ "special": true
3932
+ },
3933
+ "493": {
3934
+ "content": "<|img_row_10_col_7|>",
3935
+ "lstrip": false,
3936
+ "normalized": false,
3937
+ "rstrip": false,
3938
+ "single_word": false,
3939
+ "special": true
3940
+ },
3941
+ "494": {
3942
+ "content": "<|img_row_10_col_8|>",
3943
+ "lstrip": false,
3944
+ "normalized": false,
3945
+ "rstrip": false,
3946
+ "single_word": false,
3947
+ "special": true
3948
+ },
3949
+ "495": {
3950
+ "content": "<|img_row_10_col_9|>",
3951
+ "lstrip": false,
3952
+ "normalized": false,
3953
+ "rstrip": false,
3954
+ "single_word": false,
3955
+ "special": true
3956
+ },
3957
+ "496": {
3958
+ "content": "<|img_row_10_col_10|>",
3959
+ "lstrip": false,
3960
+ "normalized": false,
3961
+ "rstrip": false,
3962
+ "single_word": false,
3963
+ "special": true
3964
+ },
3965
+ "497": {
3966
+ "content": "<|img_thumbnail|>",
3967
+ "lstrip": false,
3968
+ "normalized": false,
3969
+ "rstrip": false,
3970
+ "single_word": false,
3971
+ "special": true
3972
+ },
3973
+ "498": {
3974
+ "content": "<|image_start|>",
3975
+ "lstrip": false,
3976
+ "normalized": false,
3977
+ "rstrip": false,
3978
+ "single_word": false,
3979
+ "special": true
3980
+ },
3981
+ "499": {
3982
+ "content": "<|image_end|>",
3983
+ "lstrip": false,
3984
+ "normalized": false,
3985
+ "rstrip": false,
3986
+ "single_word": false,
3987
+ "special": true
3988
+ },
3989
+ "500": {
3990
+ "content": "<|image_split|>",
3991
+ "lstrip": false,
3992
+ "normalized": false,
3993
+ "rstrip": false,
3994
+ "single_word": false,
3995
+ "special": true
3996
+ },
3997
+ "64011": {
3998
+ "content": "Mathias",
3999
+ "lstrip": false,
4000
+ "normalized": true,
4001
+ "rstrip": false,
4002
+ "single_word": false,
4003
+ "special": false
4004
+ },
4005
+ "64014": {
4006
+ "content": "python",
4007
+ "lstrip": false,
4008
+ "normalized": true,
4009
+ "rstrip": false,
4010
+ "single_word": false,
4011
+ "special": false
4012
+ },
4013
+ "64394": {
4014
+ "content": "<|cot_start|>",
4015
+ "lstrip": false,
4016
+ "normalized": false,
4017
+ "rstrip": false,
4018
+ "single_word": false,
4019
+ "special": true
4020
+ },
4021
+ "64395": {
4022
+ "content": "<|cot_end|>",
4023
+ "lstrip": false,
4024
+ "normalized": false,
4025
+ "rstrip": false,
4026
+ "single_word": false,
4027
+ "special": true
4028
+ },
4029
+ "64396": {
4030
+ "content": "<|review_start|>",
4031
+ "lstrip": false,
4032
+ "normalized": false,
4033
+ "rstrip": false,
4034
+ "single_word": false,
4035
+ "special": true
4036
+ },
4037
+ "64397": {
4038
+ "content": "<|review_end|>",
4039
+ "lstrip": false,
4040
+ "normalized": false,
4041
+ "rstrip": false,
4042
+ "single_word": false,
4043
+ "special": true
4044
+ },
4045
+ "64398": {
4046
+ "content": "<|file_start|>",
4047
+ "lstrip": false,
4048
+ "normalized": false,
4049
+ "rstrip": false,
4050
+ "single_word": false,
4051
+ "special": true
4052
+ },
4053
+ "64399": {
4054
+ "content": "<|file_end|>",
4055
+ "lstrip": false,
4056
+ "normalized": false,
4057
+ "rstrip": false,
4058
+ "single_word": false,
4059
+ "special": true
4060
+ }
4061
+ },
4062
+ "bos_token": "<|startoftext|>",
4063
+ "clean_up_tokenization_spaces": false,
4064
+ "eos_token": "<|im_end|>",
4065
+ "extra_special_tokens": {},
4066
+ "legacy": false,
4067
+ "model_input_names": [
4068
+ "input_ids",
4069
+ "attention_mask"
4070
+ ],
4071
+ "model_max_length": 1000000000000000019884624838656,
4072
+ "pad_token": "<|pad|>",
4073
+ "sp_model_kwargs": {},
4074
+ "spaces_between_special_tokens": false,
4075
+ "tokenizer_class": "PreTrainedTokenizerFast",
4076
+ "use_default_system_prompt": false,
4077
+ "use_fast": true
4078
+ }