riczhou committed on
Commit
4dd9b49
1 Parent(s): ac5b968

Initial commit

Browse files
logs.txt ADDED
@@ -0,0 +1,338 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/171 [00:00<?, ?it/s]
1
 
 
2
  0%| | 0/171 [00:00<?, ?it/s]
3
 
 
4
  0%| | 0/171 [00:03<?, ?it/s]
5
 
 
6
  0%| | 0/171 [00:04<?, ?it/s]
7
 
 
8
  0%| | 0/171 [00:04<?, ?it/s]
9
  1%| | 1/171 [00:04<13:53, 4.90s/it]
10
 
 
11
  1%| | 1/171 [00:05<13:53, 4.90s/it]
12
 
 
13
  1%| | 1/171 [00:05<13:53, 4.90s/it]
14
  1%| | 2/171 [00:05<06:57, 2.47s/it]
15
 
 
16
  1%| | 2/171 [00:05<06:57, 2.47s/it]
17
 
 
18
  1%| | 2/171 [00:05<06:57, 2.47s/it]
19
 
 
20
  1%| | 2/171 [00:06<06:57, 2.47s/it]
21
 
 
22
  1%| | 2/171 [00:06<06:57, 2.47s/it]
23
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
24
 
 
25
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
26
 
 
27
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
28
 
 
29
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
30
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
31
 
 
32
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
33
 
 
34
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
35
 
 
36
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
37
 
 
38
  3%|▎ | 5/171 [00:07<02:28, 1.12it/s]
39
 
 
40
  3%|▎ | 5/171 [00:07<02:28, 1.12it/s]
41
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
42
 
 
43
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
44
 
 
45
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
46
 
 
47
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
48
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
49
 
 
50
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
51
 
 
52
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
53
 
 
54
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
55
 
 
56
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
57
 
 
58
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
59
 
 
60
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
61
 
 
62
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
63
 
 
64
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
65
 
 
66
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
67
 
 
68
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
69
 
 
70
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
71
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
72
 
 
73
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
74
 
 
75
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
76
 
 
77
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
78
 
 
79
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
80
 
 
81
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
82
 
 
83
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
84
 
 
85
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
86
 
 
87
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
88
 
 
89
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
90
 
 
91
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
92
 
 
93
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
94
 
 
95
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
96
 
 
97
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
98
 
 
99
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
100
 
 
101
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
102
 
 
103
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
104
 
 
105
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
106
 
 
107
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
108
 
 
109
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
110
 
 
111
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
112
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
113
 
 
114
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
115
 
 
116
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
117
 
 
118
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
119
 
 
120
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
121
 
 
122
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
123
 
 
124
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
125
 
 
126
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
127
 
 
128
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
129
 
 
130
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
131
 
 
132
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
133
 
 
134
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
135
 
 
136
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
137
 
 
138
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
139
 
 
140
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
141
 
 
142
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
143
 
 
144
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
145
 
 
146
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
147
 
 
148
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
149
 
 
150
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
151
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
152
 
 
153
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
154
 
 
155
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
156
 
 
157
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
158
 
 
159
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
160
 
 
161
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
162
 
 
163
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
164
 
 
165
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
166
 
 
167
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
168
 
 
169
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
170
 
 
171
  24%|██▍ | 41/171 [00:08<00:04, 26.11it/s]
172
 
 
173
  24%|██▍ | 41/171 [00:08<00:04, 26.11it/s]
174
 
 
175
  24%|██▍ | 41/171 [00:08<00:04, 26.11it/s]
176
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
177
 
 
178
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
179
 
 
180
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
181
 
 
182
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
183
 
 
184
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
185
 
 
186
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
187
 
 
188
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
189
 
 
190
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
191
 
 
192
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
193
 
 
194
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
195
 
 
196
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
197
 
 
198
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
199
 
 
200
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
201
 
 
202
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
203
 
 
204
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
205
 
 
206
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
207
 
 
208
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
209
 
 
210
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
211
 
 
212
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
213
 
 
214
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
215
 
 
216
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
217
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
218
 
 
219
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
220
 
 
221
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
222
 
 
223
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
224
 
 
225
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
226
 
 
227
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
228
 
 
229
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
230
 
 
231
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
232
 
 
233
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
234
 
 
235
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
236
 
 
237
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
238
 
 
239
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
240
 
 
241
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
242
 
 
243
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
244
 
 
245
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
246
 
 
247
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
248
 
 
249
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
250
 
 
251
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
252
 
 
253
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
254
 
 
255
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
256
 
 
257
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
258
 
 
259
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
260
 
 
261
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
262
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
263
 
 
264
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
265
 
 
266
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
267
 
 
268
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
269
 
 
270
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
271
 
 
272
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
273
 
 
274
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
275
 
 
276
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
277
 
 
278
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
279
 
 
280
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
281
 
 
282
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
283
 
 
284
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
285
 
 
286
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
287
 
 
288
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
289
 
 
290
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
291
 
 
292
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
293
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
294
 
 
295
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
296
 
 
297
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
298
 
 
299
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
300
 
 
301
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
302
 
 
303
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
304
 
 
305
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
306
 
 
307
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
308
 
 
309
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
310
 
 
311
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
312
 
 
313
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
314
 
 
315
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
316
 
 
317
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
318
 
 
319
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
320
 
 
321
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
322
 
 
323
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
324
 
 
325
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
326
 
 
327
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
328
 
 
329
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
330
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
331
 
 
332
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
333
 
 
334
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
335
 
 
336
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
337
 
 
338
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
339
 
 
340
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
341
 
 
342
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
343
 
 
344
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
345
 
 
346
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
347
 
 
348
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
349
 
 
350
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
351
 
 
352
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
353
 
 
354
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
355
 
 
356
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
357
 
 
358
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
359
 
 
360
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
361
 
 
362
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
363
 
 
364
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
365
 
 
366
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
367
 
 
368
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
369
 
 
370
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
371
 
 
372
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
373
 
 
374
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
375
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
376
 
 
377
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
378
 
 
379
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
380
 
 
381
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
382
 
 
383
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
384
 
 
385
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
386
 
 
387
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
388
 
 
389
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
390
 
 
391
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
392
 
 
393
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
394
 
 
395
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
396
 
 
397
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
398
 
 
399
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
400
 
 
401
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
402
 
 
403
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
404
 
 
405
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
406
 
 
407
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
408
 
 
409
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
410
 
 
411
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
412
 
 
413
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
414
 
 
415
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
416
 
 
417
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
418
 
 
419
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
420
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
421
 
 
422
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
423
 
 
424
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
425
 
 
426
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
427
 
 
428
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
429
 
 
430
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
431
 
 
432
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
433
 
 
434
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
435
 
 
436
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
437
 
 
438
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
439
 
 
440
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
441
 
 
442
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
443
 
 
444
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
445
 
 
446
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
447
 
 
448
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
449
 
 
450
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
451
 
 
452
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
453
 
 
454
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
455
 
 
456
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
457
 
 
458
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
459
 
 
460
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
461
 
 
462
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
463
 
 
464
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
465
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
466
 
 
467
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
468
 
 
469
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
470
 
 
471
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
472
 
 
473
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
474
 
 
475
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
476
 
 
477
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
478
 
 
479
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
480
 
 
481
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
482
 
 
483
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
484
 
 
485
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
486
 
 
487
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
488
 
 
489
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
490
 
 
491
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
492
 
 
493
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
494
 
 
495
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
496
 
 
497
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
498
 
 
499
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
500
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
501
 
 
502
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
503
 
 
504
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
505
 
 
506
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
507
 
 
508
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
509
 
 
510
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
511
 
 
512
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
513
 
 
514
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
515
 
 
516
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
517
 
 
518
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
519
 
 
520
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
521
 
 
522
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
523
 
 
524
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
525
 
 
526
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
527
 
 
528
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
529
 
 
530
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
531
 
 
532
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
533
 
 
534
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
535
 
 
536
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
537
 
 
538
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
539
 
 
540
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
541
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
542
 
 
543
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
544
 
 
545
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
546
 
 
547
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
548
 
 
549
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
550
 
 
551
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
552
 
 
553
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
554
 
 
555
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
556
 
 
557
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
558
 
 
559
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
560
 
 
561
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
562
 
 
563
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
564
 
 
565
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
566
 
 
567
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
568
 
 
569
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
 
 
 
 
 
 
 
 
 
 
1
+ /opt/conda/envs/py310/bin/python -m mlc_llm gen_config /models/Qwen1.5-0.5B-Chat --quantization q4f16_1 --conv-template chatml --output /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC
2
+ [2024-06-04 03:31:28] INFO auto_config.py:116: Found model configuration: /models/Qwen1.5-0.5B-Chat/config.json
3
+ [2024-06-04 03:31:28] INFO auto_config.py:154: Found model type: qwen2. Use `--model-type` to override.
4
+ [2024-06-04 03:31:28] INFO qwen2_model.py:49: context_window_size not found in config.json. Falling back to max_position_embeddings (32768)
5
+ [2024-06-04 03:31:28] INFO qwen2_model.py:66: prefill_chunk_size defaults to 2048
6
+ [2024-06-04 03:31:28] INFO config.py:107: Overriding max_batch_size from 1 to 80
7
+ [2024-06-04 03:31:28] INFO gen_config.py:143: [generation_config.json] Setting bos_token_id: 151643
8
+ [2024-06-04 03:31:28] INFO gen_config.py:143: [generation_config.json] Setting pad_token_id: 151643
9
+ [2024-06-04 03:31:28] INFO gen_config.py:143: [generation_config.json] Setting eos_token_id: [151645, 151643]
10
+ [2024-06-04 03:31:28] INFO gen_config.py:143: [generation_config.json] Setting repetition_penalty: 1.1
11
+ [2024-06-04 03:31:28] INFO gen_config.py:143: [generation_config.json] Setting top_p: 0.8
12
+ [2024-06-04 03:31:28] INFO gen_config.py:157: Not found tokenizer config: /models/Qwen1.5-0.5B-Chat/tokenizer.model
13
+ [2024-06-04 03:31:28] INFO gen_config.py:155: Found tokenizer config: /models/Qwen1.5-0.5B-Chat/tokenizer.json. Copying to /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC/tokenizer.json
14
+ [2024-06-04 03:31:28] INFO gen_config.py:155: Found tokenizer config: /models/Qwen1.5-0.5B-Chat/vocab.json. Copying to /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC/vocab.json
15
+ [2024-06-04 03:31:28] INFO gen_config.py:155: Found tokenizer config: /models/Qwen1.5-0.5B-Chat/merges.txt. Copying to /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC/merges.txt
16
+ [2024-06-04 03:31:28] INFO gen_config.py:157: Not found tokenizer config: /models/Qwen1.5-0.5B-Chat/added_tokens.json
17
+ [2024-06-04 03:31:28] INFO gen_config.py:155: Found tokenizer config: /models/Qwen1.5-0.5B-Chat/tokenizer_config.json. Copying to /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC/tokenizer_config.json
18
+ [2024-06-04 03:31:28] INFO gen_config.py:216: Detected tokenizer info: {'token_postproc_method': 'byte_level', 'prepend_space_in_encode': False, 'strip_space_in_decode': False}
19
+ [2024-06-04 03:31:28] INFO gen_config.py:32: [System default] Setting temperature: 1.0
20
+ [2024-06-04 03:31:28] INFO gen_config.py:32: [System default] Setting presence_penalty: 0.0
21
+ [2024-06-04 03:31:28] INFO gen_config.py:32: [System default] Setting frequency_penalty: 0.0
22
+ [2024-06-04 03:31:28] INFO gen_config.py:32: [System default] Setting mean_gen_len: 128
23
+ [2024-06-04 03:31:28] INFO gen_config.py:32: [System default] Setting max_gen_len: 512
24
+ [2024-06-04 03:31:28] INFO gen_config.py:32: [System default] Setting shift_fill_factor: 0.3
25
+ [2024-06-04 03:31:28] INFO gen_config.py:223: Dumping configuration file to: /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC/mlc-chat-config.json
26
+ /opt/conda/envs/py310/bin/python -m mlc_llm convert_weight /models/Qwen1.5-0.5B-Chat --quantization q4f16_1 --output /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC
27
+ [2024-06-04 03:31:30] INFO auto_config.py:116: Found model configuration: /models/Qwen1.5-0.5B-Chat/config.json
28
+ [2024-06-04 03:31:31] INFO auto_device.py:79: Found device: cuda:0
29
+ [2024-06-04 03:31:33] INFO auto_device.py:88: Not found device: rocm:0
30
+ [2024-06-04 03:31:34] INFO auto_device.py:88: Not found device: metal:0
31
+ [2024-06-04 03:31:36] INFO auto_device.py:79: Found device: vulkan:0
32
+ [2024-06-04 03:31:36] INFO auto_device.py:79: Found device: vulkan:1
33
+ [2024-06-04 03:31:36] INFO auto_device.py:79: Found device: vulkan:2
34
+ [2024-06-04 03:31:36] INFO auto_device.py:79: Found device: vulkan:3
35
+ [2024-06-04 03:31:37] INFO auto_device.py:88: Not found device: opencl:0
36
+ [2024-06-04 03:31:37] INFO auto_device.py:35: Using device: cuda:0
37
+ [2024-06-04 03:31:37] INFO auto_weight.py:71: Finding weights in: /models/Qwen1.5-0.5B-Chat
38
+ [2024-06-04 03:31:37] INFO auto_weight.py:137: Not found Huggingface PyTorch
39
+ [2024-06-04 03:31:37] INFO auto_weight.py:144: Found source weight format: huggingface-safetensor. Source configuration: /models/Qwen1.5-0.5B-Chat/model.safetensors.index.json
40
+ [2024-06-04 03:31:37] INFO auto_weight.py:107: Using source weight configuration: /models/Qwen1.5-0.5B-Chat/model.safetensors.index.json. Use `--source` to override.
41
+ [2024-06-04 03:31:37] INFO auto_weight.py:111: Using source weight format: huggingface-safetensor. Use `--source-format` to override.
42
+ [2024-06-04 03:31:37] INFO auto_config.py:154: Found model type: qwen2. Use `--model-type` to override.
43
+ [2024-06-04 03:31:37] INFO qwen2_model.py:49: context_window_size not found in config.json. Falling back to max_position_embeddings (32768)
44
+ [2024-06-04 03:31:37] INFO qwen2_model.py:66: prefill_chunk_size defaults to 2048
45
+ Weight conversion with arguments:
46
+ --config /models/Qwen1.5-0.5B-Chat/config.json
47
+ --quantization GroupQuantize(name='q4f16_1', kind='group-quant', group_size=32, quantize_dtype='int4', storage_dtype='uint32', model_dtype='float16', linear_weight_layout='NK', quantize_embedding=True, quantize_final_fc=True, num_elem_per_storage=8, num_storage_per_group=4, max_int_value=7)
48
+ --model-type qwen2
49
+ --device cuda:0
50
+ --source /models/Qwen1.5-0.5B-Chat/model.safetensors.index.json
51
+ --source-format huggingface-safetensor
52
+ --output /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC
53
+ Start storing to cache /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC
54
+
55
  0%| | 0/171 [00:00<?, ?it/s]
56
 
57
+
58
  0%| | 0/171 [00:00<?, ?it/s]
59
 
60
+
61
  0%| | 0/171 [00:03<?, ?it/s]
62
 
63
+
64
  0%| | 0/171 [00:04<?, ?it/s]
65
 
66
+
67
  0%| | 0/171 [00:04<?, ?it/s]
68
  1%| | 1/171 [00:04<13:53, 4.90s/it]
69
 
70
+
71
  1%| | 1/171 [00:05<13:53, 4.90s/it]
72
 
73
+
74
  1%| | 1/171 [00:05<13:53, 4.90s/it]
75
  1%| | 2/171 [00:05<06:57, 2.47s/it]
76
 
77
+
78
  1%| | 2/171 [00:05<06:57, 2.47s/it]
79
 
80
+
81
  1%| | 2/171 [00:05<06:57, 2.47s/it]
82
 
83
+
84
  1%| | 2/171 [00:06<06:57, 2.47s/it]
85
 
86
+
87
  1%| | 2/171 [00:06<06:57, 2.47s/it]
88
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
89
 
90
+
91
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
92
 
93
+
94
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
95
 
96
+
97
  2%|▏ | 4/171 [00:06<02:59, 1.07s/it]
98
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
99
 
100
+
101
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
102
 
103
+
104
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
105
 
106
+
107
  3%|▎ | 5/171 [00:06<02:28, 1.12it/s]
108
 
109
+
110
  3%|▎ | 5/171 [00:07<02:28, 1.12it/s]
111
 
112
+
113
  3%|▎ | 5/171 [00:07<02:28, 1.12it/s]
114
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
115
 
116
+
117
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
118
 
119
+
120
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
121
 
122
+
123
  5%|▍ | 8/171 [00:07<01:17, 2.11it/s]
124
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
125
 
126
+
127
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
128
 
129
+
130
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
131
 
132
+
133
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
134
 
135
+
136
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
137
 
138
+
139
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
140
 
141
+
142
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
143
 
144
+
145
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
146
 
147
+
148
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
149
 
150
+
151
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
152
 
153
+
154
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
155
 
156
+
157
  5%|▌ | 9/171 [00:07<01:16, 2.11it/s]
158
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
159
 
160
+
161
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
162
 
163
+
164
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
165
 
166
+
167
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
168
 
169
+
170
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
171
 
172
+
173
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
174
 
175
+
176
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
177
 
178
+
179
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
180
 
181
+
182
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
183
 
184
+
185
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
186
 
187
+
188
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
189
 
190
+
191
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
192
 
193
+
194
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
195
 
196
+
197
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
198
 
199
+
200
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
201
 
202
+
203
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
204
 
205
+
206
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
207
 
208
+
209
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
210
 
211
+
212
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
213
 
214
+
215
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
216
 
217
+
218
  9%|▉ | 16/171 [00:07<00:25, 6.11it/s]
219
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
220
 
221
+
222
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
223
 
224
+
225
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
226
 
227
+
228
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
229
 
230
+
231
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
232
 
233
+
234
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
235
 
236
+
237
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
238
 
239
+
240
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
241
 
242
+
243
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
244
 
245
+
246
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
247
 
248
+
249
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
250
 
251
+
252
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
253
 
254
+
255
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
256
 
257
+
258
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
259
 
260
+
261
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
262
 
263
+
264
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
265
 
266
+
267
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
268
 
269
+
270
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
271
 
272
+
273
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
274
 
275
+
276
  17%|█▋ | 29/171 [00:07<00:09, 15.69it/s]
277
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
278
 
279
+
280
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
281
 
282
+
283
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
284
 
285
+
286
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
287
 
288
+
289
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
290
 
291
+
292
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
293
 
294
+
295
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
296
 
297
+
298
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
299
 
300
+
301
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
302
 
303
+
304
  24%|██▍ | 41/171 [00:07<00:04, 26.11it/s]
305
 
306
+
307
  24%|██▍ | 41/171 [00:08<00:04, 26.11it/s]
308
 
309
+
310
  24%|██▍ | 41/171 [00:08<00:04, 26.11it/s]
311
 
312
+
313
  24%|██▍ | 41/171 [00:08<00:04, 26.11it/s]
314
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
315
 
316
+
317
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
318
 
319
+
320
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
321
 
322
+
323
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
324
 
325
+
326
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
327
 
328
+
329
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
330
 
331
+
332
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
333
 
334
+
335
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
336
 
337
+
338
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
339
 
340
+
341
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
342
 
343
+
344
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
345
 
346
+
347
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
348
 
349
+
350
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
351
 
352
+
353
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
354
 
355
+
356
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
357
 
358
+
359
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
360
 
361
+
362
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
363
 
364
+
365
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
366
 
367
+
368
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
369
 
370
+
371
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
372
 
373
+
374
  29%|██▊ | 49/171 [00:08<00:03, 32.06it/s]
375
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
376
 
377
+
378
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
379
 
380
+
381
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
382
 
383
+
384
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
385
 
386
+
387
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
388
 
389
+
390
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
391
 
392
+
393
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
394
 
395
+
396
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
397
 
398
+
399
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
400
 
401
+
402
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
403
 
404
+
405
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
406
 
407
+
408
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
409
 
410
+
411
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
412
 
413
+
414
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
415
 
416
+
417
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
418
 
419
+
420
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
421
 
422
+
423
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
424
 
425
+
426
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
427
 
428
+
429
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
430
 
431
+
432
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
433
 
434
+
435
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
436
 
437
+
438
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
439
 
440
+
441
  36%|███▌ | 61/171 [00:08<00:02, 43.84it/s]
442
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
443
 
444
+
445
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
446
 
447
+
448
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
449
 
450
+
451
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
452
 
453
+
454
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
455
 
456
+
457
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
458
 
459
+
460
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
461
 
462
+
463
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
464
 
465
+
466
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
467
 
468
+
469
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
470
 
471
+
472
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
473
 
474
+
475
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
476
 
477
+
478
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
479
 
480
+
481
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
482
 
483
+
484
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
485
 
486
+
487
  44%|████▍ | 75/171 [00:08<00:01, 58.43it/s]
488
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
489
 
490
+
491
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
492
 
493
+
494
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
495
 
496
+
497
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
498
 
499
+
500
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
501
 
502
+
503
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
504
 
505
+
506
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
507
 
508
+
509
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
510
 
511
+
512
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
513
 
514
+
515
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
516
 
517
+
518
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
519
 
520
+
521
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
522
 
523
+
524
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
525
 
526
+
527
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
528
 
529
+
530
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
531
 
532
+
533
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
534
 
535
+
536
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
537
 
538
+
539
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
540
 
541
+
542
  50%|████▉ | 85/171 [00:08<00:01, 61.64it/s]
543
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
544
 
545
+
546
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
547
 
548
+
549
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
550
 
551
+
552
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
553
 
554
+
555
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
556
 
557
+
558
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
559
 
560
+
561
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
562
 
563
+
564
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
565
 
566
+
567
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
568
 
569
+
570
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
571
 
572
+
573
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
574
 
575
+
576
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
577
 
578
+
579
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
580
 
581
+
582
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
583
 
584
+
585
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
586
 
587
+
588
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
589
 
590
+
591
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
592
 
593
+
594
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
595
 
596
+
597
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
598
 
599
+
600
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
601
 
602
+
603
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
604
 
605
+
606
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
607
 
608
+
609
  56%|█████▌ | 96/171 [00:08<00:01, 71.32it/s]
610
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
611
 
612
+
613
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
614
 
615
+
616
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
617
 
618
+
619
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
620
 
621
+
622
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
623
 
624
+
625
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
626
 
627
+
628
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
629
 
630
+
631
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
632
 
633
+
634
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
635
 
636
+
637
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
638
 
639
+
640
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
641
 
642
+
643
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
644
 
645
+
646
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
647
 
648
+
649
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
650
 
651
+
652
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
653
 
654
+
655
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
656
 
657
+
658
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
659
 
660
+
661
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
662
 
663
+
664
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
665
 
666
+
667
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
668
 
669
+
670
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
671
 
672
+
673
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
674
 
675
+
676
  64%|██████▍ | 110/171 [00:08<00:00, 73.99it/s]
677
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
678
 
679
+
680
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
681
 
682
+
683
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
684
 
685
+
686
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
687
 
688
+
689
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
690
 
691
+
692
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
693
 
694
+
695
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
696
 
697
+
698
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
699
 
700
+
701
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
702
 
703
+
704
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
705
 
706
+
707
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
708
 
709
+
710
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
711
 
712
+
713
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
714
 
715
+
716
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
717
 
718
+
719
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
720
 
721
+
722
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
723
 
724
+
725
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
726
 
727
+
728
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
729
 
730
+
731
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
732
 
733
+
734
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
735
 
736
+
737
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
738
 
739
+
740
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
741
 
742
+
743
  73%|███████▎ | 124/171 [00:08<00:00, 85.07it/s]
744
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
745
 
746
+
747
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
748
 
749
+
750
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
751
 
752
+
753
  81%|████████ | 138/171 [00:08<00:00, 94.74it/s]
754
 
755
+
756
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
757
 
758
+
759
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
760
 
761
+
762
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
763
 
764
+
765
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
766
 
767
+
768
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
769
 
770
+
771
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
772
 
773
+
774
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
775
 
776
+
777
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
778
 
779
+
780
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
781
 
782
+
783
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
784
 
785
+
786
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
787
 
788
+
789
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
790
 
791
+
792
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
793
 
794
+
795
  81%|████████ | 138/171 [00:09<00:00, 94.74it/s]
796
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
797
 
798
+
799
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
800
 
801
+
802
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
803
 
804
+
805
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
806
 
807
+
808
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
809
 
810
+
811
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
812
 
813
+
814
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
815
 
816
+
817
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
818
 
819
+
820
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
821
 
822
+
823
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
824
 
825
+
826
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
827
 
828
+
829
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
830
 
831
+
832
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
833
 
834
+
835
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
836
 
837
+
838
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
839
 
840
+
841
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
842
 
843
+
844
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
845
 
846
+
847
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
848
 
849
+
850
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
851
 
852
+
853
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
854
 
855
+
856
  87%|████████▋ | 149/171 [00:09<00:00, 90.11it/s]
857
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
858
 
859
+
860
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
861
 
862
+
863
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
864
 
865
+
866
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
867
 
868
+
869
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
870
 
871
+
872
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
873
 
874
+
875
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
876
 
877
+
878
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
879
 
880
+
881
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
882
 
883
+
884
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
885
 
886
+
887
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
888
 
889
+
890
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
891
 
892
+
893
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
894
 
895
+
896
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
897
 
898
+
899
  95%|█████████▍| 162/171 [00:09<00:00, 97.51it/s]
900
+ [2024-06-04 03:31:48] INFO huggingface_loader.py:197: Unloading HF weight file: /models/Qwen1.5-0.5B-Chat/model.safetensors
901
+ [2024-06-04 03:31:48] INFO stats.py:77: Time usage: HF loading: 3.360 sec; Pre-quantization mapping: 2.166 sec; Quantization: 2.748 sec
902
+ [2024-06-04 03:31:48] INFO stats.py:91: RAM usage: Peak RAM: 2.308 GB. Total bytes loaded from disk: 2.308 GB
903
+ [2024-06-04 03:31:48] INFO convert_weight.py:155: Parameter size after quantization: 0.325 GB
904
+ [2024-06-04 03:31:48] INFO convert_weight.py:160: Total parameters: 619,570,176
905
+ [2024-06-04 03:31:48] INFO convert_weight.py:161: Bits per parameter: 4.502
906
+ [2024-06-04 03:31:48] INFO convert_weight.py:166: Saved to directory: /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC
907
+
908
+ All finished, 8 total shards committed, record saved to /models/mlc-delivery/hf/mlc-ai/Qwen1.5-0.5B-Chat-q4f16_1-MLC/ndarray-cache.json
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen2",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 1024,
8
+ "intermediate_size": 2816,
9
+ "num_attention_heads": 16,
10
+ "num_hidden_layers": 24,
11
+ "num_key_value_heads": 16,
12
+ "rms_norm_eps": 1e-06,
13
+ "rope_theta": 1000000.0,
14
+ "vocab_size": 151936,
15
+ "context_window_size": 32768,
16
+ "prefill_chunk_size": 2048,
17
+ "tensor_parallel_shards": 1,
18
+ "head_dim": 64,
19
+ "dtype": "float32",
20
+ "max_batch_size": 80
21
+ },
22
+ "vocab_size": 151936,
23
+ "context_window_size": 32768,
24
+ "sliding_window_size": -1,
25
+ "prefill_chunk_size": 2048,
26
+ "attention_sink_size": -1,
27
+ "tensor_parallel_shards": 1,
28
+ "temperature": 1.0,
29
+ "presence_penalty": 0.0,
30
+ "frequency_penalty": 0.0,
31
+ "repetition_penalty": 1.1,
32
+ "top_p": 0.8,
33
+ "tokenizer_files": [
34
+ "tokenizer.json",
35
+ "vocab.json",
36
+ "merges.txt",
37
+ "tokenizer_config.json"
38
+ ],
39
+ "tokenizer_info": {
40
+ "token_postproc_method": "byte_level",
41
+ "prepend_space_in_encode": false,
42
+ "strip_space_in_decode": false
43
+ },
44
+ "conv_template": {
45
+ "name": "chatml",
46
+ "system_template": "<|im_start|>system\n{system_message}",
47
+ "system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
48
+ "system_prefix_token_ids": null,
49
+ "add_role_after_system_message": true,
50
+ "roles": {
51
+ "user": "<|im_start|>user",
52
+ "assistant": "<|im_start|>assistant"
53
+ },
54
+ "role_templates": {
55
+ "user": "{user_message}",
56
+ "assistant": "{assistant_message}",
57
+ "tool": "{tool_message}"
58
+ },
59
+ "messages": [],
60
+ "seps": [
61
+ "<|im_end|>\n"
62
+ ],
63
+ "role_content_sep": "\n",
64
+ "role_empty_sep": "\n",
65
+ "stop_str": [
66
+ "<|im_end|>"
67
+ ],
68
+ "stop_token_ids": [
69
+ 2
70
+ ],
71
+ "function_string": "",
72
+ "use_function_calling": false
73
+ },
74
+ "pad_token_id": 151643,
75
+ "bos_token_id": 151643,
76
+ "eos_token_id": [
77
+ 151645,
78
+ 151643
79
+ ],
80
+ "mean_gen_len": 128,
81
+ "max_gen_len": 512,
82
+ "shift_fill_factor": 0.3
83
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6cdec4c05b14a3edfe1cb4f9997905139511034d77cb5d6f4b4731524a528be
3
+ size 77791232
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6cdec4c05b14a3edfe1cb4f9997905139511034d77cb5d6f4b4731524a528be
3
+ size 77791232
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4c2f1823ac925626866bacb00359cf838c1bfda0bc7e0f457aa89d36f9e9200
3
+ size 33329152
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e2c2275f36f20cd76b1b331911b40038457984f9083eadb47ff274ddde787a7
3
+ size 31156224
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:629f399433273fb57f7d28c35b1ed77e7d5cd36c86fdfa56f4018edf170b84c4
3
+ size 32194560
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd38b0f9801c9860ceff5f64fb76b8a574305899ff2f4fefe6d45cb7a036971c
3
+ size 32925696
params_shard_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d24e952c343829ddbe4ce62963ca67ca7f7b800be4b1810199e52589e2be8a2
3
+ size 32194560
params_shard_7.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e3546b0fbf83efcfc8f2d5642fb3521b4d6a5b81c23b19bdd539a1601a9b385
3
+ size 31303680
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "151643": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "151644": {
13
+ "content": "<|im_start|>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "151645": {
21
+ "content": "<|im_end|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ }
28
+ },
29
+ "additional_special_tokens": ["<|im_start|>", "<|im_end|>"],
30
+ "bos_token": null,
31
+ "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
32
+ "clean_up_tokenization_spaces": false,
33
+ "eos_token": "<|im_end|>",
34
+ "errors": "replace",
35
+ "model_max_length": 32768,
36
+ "pad_token": "<|endoftext|>",
37
+ "split_special_tokens": false,
38
+ "tokenizer_class": "Qwen2Tokenizer",
39
+ "unk_token": null
40
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff