GeneZC committed on
Commit
457d807
1 Parent(s): b72a6f9

Upload 5 files

Browse files
config.json ADDED
@@ -0,0 +1,705 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "../plms/bert-base-uncased",
3
+ "architectures": [
4
+ "SparseBertHidden"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
15
+ "layer_skip": 1,
16
+ "max_position_embeddings": 512,
17
+ "model_type": "bert",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 12,
20
+ "pad_token_id": 0,
21
+ "position_embedding_type": "absolute",
22
+ "sparsity": "0",
23
+ "sparsity_map": {
24
+ "0": {
25
+ "head": {},
26
+ "hidden": {
27
+ "-1": 0,
28
+ "0": 0,
29
+ "1": 0,
30
+ "10": 0,
31
+ "11": 0,
32
+ "2": 0,
33
+ "3": 0,
34
+ "4": 0,
35
+ "5": 0,
36
+ "6": 0,
37
+ "7": 0,
38
+ "8": 0,
39
+ "9": 0
40
+ },
41
+ "neuron": {}
42
+ },
43
+ "10": {
44
+ "head": {
45
+ "1": 5,
46
+ "11": 1,
47
+ "3": 1
48
+ },
49
+ "hidden": {
50
+ "-1": 38,
51
+ "0": 38,
52
+ "1": 38,
53
+ "10": 38,
54
+ "11": 38,
55
+ "2": 38,
56
+ "3": 38,
57
+ "4": 38,
58
+ "5": 38,
59
+ "6": 38,
60
+ "7": 38,
61
+ "8": 38,
62
+ "9": 38
63
+ },
64
+ "neuron": {
65
+ "0": 190,
66
+ "1": 298,
67
+ "11": 1,
68
+ "2": 1323,
69
+ "3": 4,
70
+ "4": 5,
71
+ "5": 8,
72
+ "6": 4,
73
+ "7": 7,
74
+ "8": 2,
75
+ "9": 1
76
+ }
77
+ },
78
+ "20": {
79
+ "head": {
80
+ "0": 1,
81
+ "1": 7,
82
+ "10": 1,
83
+ "11": 4,
84
+ "3": 2,
85
+ "9": 1
86
+ },
87
+ "hidden": {
88
+ "-1": 84,
89
+ "0": 84,
90
+ "1": 84,
91
+ "10": 84,
92
+ "11": 84,
93
+ "2": 84,
94
+ "3": 84,
95
+ "4": 84,
96
+ "5": 84,
97
+ "6": 84,
98
+ "7": 84,
99
+ "8": 84,
100
+ "9": 84
101
+ },
102
+ "neuron": {
103
+ "0": 597,
104
+ "1": 802,
105
+ "11": 16,
106
+ "2": 2294,
107
+ "3": 48,
108
+ "4": 78,
109
+ "5": 123,
110
+ "6": 22,
111
+ "7": 47,
112
+ "8": 23,
113
+ "9": 5
114
+ }
115
+ },
116
+ "30": {
117
+ "head": {
118
+ "0": 1,
119
+ "1": 8,
120
+ "10": 2,
121
+ "11": 4,
122
+ "2": 1,
123
+ "3": 2,
124
+ "6": 1,
125
+ "7": 1,
126
+ "8": 1,
127
+ "9": 2
128
+ },
129
+ "hidden": {
130
+ "-1": 123,
131
+ "0": 123,
132
+ "1": 123,
133
+ "10": 123,
134
+ "11": 123,
135
+ "2": 123,
136
+ "3": 123,
137
+ "4": 123,
138
+ "5": 123,
139
+ "6": 123,
140
+ "7": 123,
141
+ "8": 123,
142
+ "9": 123
143
+ },
144
+ "neuron": {
145
+ "0": 980,
146
+ "1": 1233,
147
+ "10": 2,
148
+ "11": 116,
149
+ "2": 2512,
150
+ "3": 132,
151
+ "4": 233,
152
+ "5": 386,
153
+ "6": 61,
154
+ "7": 146,
155
+ "8": 73,
156
+ "9": 24
157
+ }
158
+ },
159
+ "40": {
160
+ "head": {
161
+ "0": 3,
162
+ "1": 8,
163
+ "10": 2,
164
+ "11": 5,
165
+ "2": 1,
166
+ "3": 3,
167
+ "4": 2,
168
+ "5": 1,
169
+ "6": 2,
170
+ "7": 1,
171
+ "8": 1,
172
+ "9": 4
173
+ },
174
+ "hidden": {
175
+ "-1": 177,
176
+ "0": 177,
177
+ "1": 177,
178
+ "10": 177,
179
+ "11": 177,
180
+ "2": 177,
181
+ "3": 177,
182
+ "4": 177,
183
+ "5": 177,
184
+ "6": 177,
185
+ "7": 177,
186
+ "8": 177,
187
+ "9": 177
188
+ },
189
+ "neuron": {
190
+ "0": 1436,
191
+ "1": 1664,
192
+ "10": 6,
193
+ "11": 518,
194
+ "2": 2634,
195
+ "3": 306,
196
+ "4": 449,
197
+ "5": 732,
198
+ "6": 138,
199
+ "7": 321,
200
+ "8": 184,
201
+ "9": 91
202
+ }
203
+ },
204
+ "50": {
205
+ "head": {
206
+ "0": 5,
207
+ "1": 8,
208
+ "10": 3,
209
+ "11": 5,
210
+ "2": 2,
211
+ "3": 3,
212
+ "4": 3,
213
+ "5": 2,
214
+ "6": 3,
215
+ "7": 2,
216
+ "8": 2,
217
+ "9": 4
218
+ },
219
+ "hidden": {
220
+ "-1": 223,
221
+ "0": 223,
222
+ "1": 223,
223
+ "10": 223,
224
+ "11": 223,
225
+ "2": 223,
226
+ "3": 223,
227
+ "4": 223,
228
+ "5": 223,
229
+ "6": 223,
230
+ "7": 223,
231
+ "8": 223,
232
+ "9": 223
233
+ },
234
+ "neuron": {
235
+ "0": 1749,
236
+ "1": 1933,
237
+ "10": 21,
238
+ "11": 915,
239
+ "2": 2699,
240
+ "3": 519,
241
+ "4": 664,
242
+ "5": 976,
243
+ "6": 252,
244
+ "7": 469,
245
+ "8": 307,
246
+ "9": 187
247
+ }
248
+ },
249
+ "60": {
250
+ "head": {
251
+ "0": 6,
252
+ "1": 8,
253
+ "10": 5,
254
+ "11": 7,
255
+ "2": 3,
256
+ "3": 4,
257
+ "4": 4,
258
+ "5": 3,
259
+ "6": 5,
260
+ "7": 2,
261
+ "8": 2,
262
+ "9": 4
263
+ },
264
+ "hidden": {
265
+ "-1": 284,
266
+ "0": 284,
267
+ "1": 284,
268
+ "10": 284,
269
+ "11": 284,
270
+ "2": 284,
271
+ "3": 284,
272
+ "4": 284,
273
+ "5": 284,
274
+ "6": 284,
275
+ "7": 284,
276
+ "8": 284,
277
+ "9": 284
278
+ },
279
+ "neuron": {
280
+ "0": 2065,
281
+ "1": 2200,
282
+ "10": 67,
283
+ "11": 1392,
284
+ "2": 2762,
285
+ "3": 817,
286
+ "4": 991,
287
+ "5": 1279,
288
+ "6": 454,
289
+ "7": 695,
290
+ "8": 521,
291
+ "9": 397
292
+ }
293
+ },
294
+ "70": {
295
+ "head": {
296
+ "0": 6,
297
+ "1": 8,
298
+ "10": 6,
299
+ "11": 7,
300
+ "2": 4,
301
+ "3": 6,
302
+ "4": 4,
303
+ "5": 5,
304
+ "6": 6,
305
+ "7": 3,
306
+ "8": 5,
307
+ "9": 5
308
+ },
309
+ "hidden": {
310
+ "-1": 346,
311
+ "0": 346,
312
+ "1": 346,
313
+ "10": 346,
314
+ "11": 346,
315
+ "2": 346,
316
+ "3": 346,
317
+ "4": 346,
318
+ "5": 346,
319
+ "6": 346,
320
+ "7": 346,
321
+ "8": 346,
322
+ "9": 346
323
+ },
324
+ "neuron": {
325
+ "0": 2266,
326
+ "1": 2390,
327
+ "10": 206,
328
+ "11": 1745,
329
+ "2": 2820,
330
+ "3": 1173,
331
+ "4": 1308,
332
+ "5": 1537,
333
+ "6": 694,
334
+ "7": 951,
335
+ "8": 791,
336
+ "9": 708
337
+ }
338
+ },
339
+ "80": {
340
+ "head": {
341
+ "0": 6,
342
+ "1": 9,
343
+ "10": 8,
344
+ "11": 8,
345
+ "2": 6,
346
+ "3": 6,
347
+ "4": 6,
348
+ "5": 9,
349
+ "6": 7,
350
+ "7": 4,
351
+ "8": 5,
352
+ "9": 5
353
+ },
354
+ "hidden": {
355
+ "-1": 422,
356
+ "0": 422,
357
+ "1": 422,
358
+ "10": 422,
359
+ "11": 422,
360
+ "2": 422,
361
+ "3": 422,
362
+ "4": 422,
363
+ "5": 422,
364
+ "6": 422,
365
+ "7": 422,
366
+ "8": 422,
367
+ "9": 422
368
+ },
369
+ "neuron": {
370
+ "0": 2450,
371
+ "1": 2541,
372
+ "10": 574,
373
+ "11": 2105,
374
+ "2": 2863,
375
+ "3": 1559,
376
+ "4": 1676,
377
+ "5": 1862,
378
+ "6": 1071,
379
+ "7": 1294,
380
+ "8": 1154,
381
+ "9": 1126
382
+ }
383
+ },
384
+ "85": {
385
+ "head": {
386
+ "0": 6,
387
+ "1": 9,
388
+ "10": 10,
389
+ "11": 8,
390
+ "2": 6,
391
+ "3": 6,
392
+ "4": 7,
393
+ "5": 9,
394
+ "6": 8,
395
+ "7": 7,
396
+ "8": 5,
397
+ "9": 7
398
+ },
399
+ "hidden": {
400
+ "-1": 468,
401
+ "0": 468,
402
+ "1": 468,
403
+ "10": 468,
404
+ "11": 468,
405
+ "2": 468,
406
+ "3": 468,
407
+ "4": 468,
408
+ "5": 468,
409
+ "6": 468,
410
+ "7": 468,
411
+ "8": 468,
412
+ "9": 468
413
+ },
414
+ "neuron": {
415
+ "0": 2554,
416
+ "1": 2635,
417
+ "10": 936,
418
+ "11": 2278,
419
+ "2": 2889,
420
+ "3": 1780,
421
+ "4": 1836,
422
+ "5": 2037,
423
+ "6": 1292,
424
+ "7": 1489,
425
+ "8": 1360,
426
+ "9": 1401
427
+ }
428
+ },
429
+ "90": {
430
+ "head": {
431
+ "0": 6,
432
+ "1": 9,
433
+ "10": 11,
434
+ "11": 8,
435
+ "2": 7,
436
+ "3": 7,
437
+ "4": 9,
438
+ "5": 9,
439
+ "6": 9,
440
+ "7": 9,
441
+ "8": 6,
442
+ "9": 8
443
+ },
444
+ "hidden": {
445
+ "-1": 522,
446
+ "0": 522,
447
+ "1": 522,
448
+ "10": 522,
449
+ "11": 522,
450
+ "2": 522,
451
+ "3": 522,
452
+ "4": 522,
453
+ "5": 522,
454
+ "6": 522,
455
+ "7": 522,
456
+ "8": 522,
457
+ "9": 522
458
+ },
459
+ "neuron": {
460
+ "0": 2653,
461
+ "1": 2713,
462
+ "10": 1390,
463
+ "11": 2433,
464
+ "2": 2913,
465
+ "3": 2013,
466
+ "4": 2064,
467
+ "5": 2243,
468
+ "6": 1569,
469
+ "7": 1741,
470
+ "8": 1648,
471
+ "9": 1688
472
+ }
473
+ },
474
+ "95": {
475
+ "head": {
476
+ "0": 8,
477
+ "1": 10,
478
+ "10": 11,
479
+ "11": 9,
480
+ "2": 9,
481
+ "3": 9,
482
+ "4": 9,
483
+ "5": 9,
484
+ "6": 11,
485
+ "7": 9,
486
+ "8": 9,
487
+ "9": 9
488
+ },
489
+ "hidden": {
490
+ "-1": 599,
491
+ "0": 599,
492
+ "1": 599,
493
+ "10": 599,
494
+ "11": 599,
495
+ "2": 599,
496
+ "3": 599,
497
+ "4": 599,
498
+ "5": 599,
499
+ "6": 599,
500
+ "7": 599,
501
+ "8": 599,
502
+ "9": 599
503
+ },
504
+ "neuron": {
505
+ "0": 2753,
506
+ "1": 2799,
507
+ "10": 2001,
508
+ "11": 2654,
509
+ "2": 2948,
510
+ "3": 2337,
511
+ "4": 2381,
512
+ "5": 2519,
513
+ "6": 1992,
514
+ "7": 2148,
515
+ "8": 2061,
516
+ "9": 2161
517
+ }
518
+ },
519
+ "96": {
520
+ "head": {
521
+ "0": 9,
522
+ "1": 10,
523
+ "10": 11,
524
+ "11": 10,
525
+ "2": 9,
526
+ "3": 9,
527
+ "4": 9,
528
+ "5": 10,
529
+ "6": 11,
530
+ "7": 9,
531
+ "8": 9,
532
+ "9": 9
533
+ },
534
+ "hidden": {
535
+ "-1": 614,
536
+ "0": 614,
537
+ "1": 614,
538
+ "10": 614,
539
+ "11": 614,
540
+ "2": 614,
541
+ "3": 614,
542
+ "4": 614,
543
+ "5": 614,
544
+ "6": 614,
545
+ "7": 614,
546
+ "8": 614,
547
+ "9": 614
548
+ },
549
+ "neuron": {
550
+ "0": 2768,
551
+ "1": 2822,
552
+ "10": 2133,
553
+ "11": 2689,
554
+ "2": 2955,
555
+ "3": 2392,
556
+ "4": 2439,
557
+ "5": 2579,
558
+ "6": 2077,
559
+ "7": 2223,
560
+ "8": 2148,
561
+ "9": 2266
562
+ }
563
+ },
564
+ "97": {
565
+ "head": {
566
+ "0": 10,
567
+ "1": 10,
568
+ "10": 11,
569
+ "11": 10,
570
+ "2": 9,
571
+ "3": 9,
572
+ "4": 9,
573
+ "5": 10,
574
+ "6": 11,
575
+ "7": 10,
576
+ "8": 11,
577
+ "9": 10
578
+ },
579
+ "hidden": {
580
+ "-1": 637,
581
+ "0": 637,
582
+ "1": 637,
583
+ "10": 637,
584
+ "11": 637,
585
+ "2": 637,
586
+ "3": 637,
587
+ "4": 637,
588
+ "5": 637,
589
+ "6": 637,
590
+ "7": 637,
591
+ "8": 637,
592
+ "9": 637
593
+ },
594
+ "neuron": {
595
+ "0": 2799,
596
+ "1": 2846,
597
+ "10": 2294,
598
+ "11": 2746,
599
+ "2": 2970,
600
+ "3": 2487,
601
+ "4": 2537,
602
+ "5": 2656,
603
+ "6": 2207,
604
+ "7": 2355,
605
+ "8": 2291,
606
+ "9": 2409
607
+ }
608
+ },
609
+ "98": {
610
+ "head": {
611
+ "0": 11,
612
+ "1": 10,
613
+ "10": 11,
614
+ "11": 10,
615
+ "2": 10,
616
+ "3": 10,
617
+ "4": 10,
618
+ "5": 10,
619
+ "6": 11,
620
+ "7": 10,
621
+ "8": 11,
622
+ "9": 10
623
+ },
624
+ "hidden": {
625
+ "-1": 660,
626
+ "0": 660,
627
+ "1": 660,
628
+ "10": 660,
629
+ "11": 660,
630
+ "2": 660,
631
+ "3": 660,
632
+ "4": 660,
633
+ "5": 660,
634
+ "6": 660,
635
+ "7": 660,
636
+ "8": 660,
637
+ "9": 660
638
+ },
639
+ "neuron": {
640
+ "0": 2826,
641
+ "1": 2870,
642
+ "10": 2455,
643
+ "11": 2794,
644
+ "2": 2984,
645
+ "3": 2588,
646
+ "4": 2634,
647
+ "5": 2726,
648
+ "6": 2350,
649
+ "7": 2501,
650
+ "8": 2440,
651
+ "9": 2535
652
+ }
653
+ },
654
+ "99": {
655
+ "head": {
656
+ "0": 11,
657
+ "1": 10,
658
+ "10": 11,
659
+ "11": 11,
660
+ "2": 11,
661
+ "3": 11,
662
+ "4": 11,
663
+ "5": 11,
664
+ "6": 11,
665
+ "7": 11,
666
+ "8": 11,
667
+ "9": 10
668
+ },
669
+ "hidden": {
670
+ "-1": 691,
671
+ "0": 691,
672
+ "1": 691,
673
+ "10": 691,
674
+ "11": 691,
675
+ "2": 691,
676
+ "3": 691,
677
+ "4": 691,
678
+ "5": 691,
679
+ "6": 691,
680
+ "7": 691,
681
+ "8": 691,
682
+ "9": 691
683
+ },
684
+ "neuron": {
685
+ "0": 2861,
686
+ "1": 2915,
687
+ "10": 2683,
688
+ "11": 2862,
689
+ "2": 2998,
690
+ "3": 2709,
691
+ "4": 2746,
692
+ "5": 2845,
693
+ "6": 2551,
694
+ "7": 2678,
695
+ "8": 2635,
696
+ "9": 2695
697
+ }
698
+ }
699
+ },
700
+ "torch_dtype": "float32",
701
+ "transformers_version": "4.12.0",
702
+ "type_vocab_size": 2,
703
+ "use_cache": true,
704
+ "vocab_size": 30522
705
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56a41b64b6df1ddee8da268b5f67b714ef3b198e9eee1c97b1d0fb0b067684ce
3
+ size 440508517
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": true, "do_basic_tokenize": true, "never_split": null, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "../plms/bert-base-uncased", "use_fast": true, "tokenizer_file": null, "tokenizer_class": "BertTokenizer"}
vocab.txt ADDED
The diff for this file is too large to render. See raw diff