{
  "quant_cfg": {
    "*weight_quantizer": {
      "num_bits": [
        2,
        1
      ],
      "block_sizes": {
        "-1": 16,
        "type": "dynamic",
        "scale_bits": [
          4,
          3
        ]
      },
      "enable": true
    },
    "*input_quantizer": {
      "enable": false
    },
    "nn.BatchNorm1d": {
      "*": {
        "enable": false
      }
    },
    "nn.BatchNorm2d": {
      "*": {
        "enable": false
      }
    },
    "nn.BatchNorm3d": {
      "*": {
        "enable": false
      }
    },
    "nn.LeakyReLU": {
      "*": {
        "enable": false
      }
    },
    "*lm_head*": {
      "enable": false
    },
    "*proj_out.*": {
      "enable": false
    },
    "*block_sparse_moe.gate*": {
      "enable": false
    },
    "*router*": {
      "enable": false
    },
    "*mlp.gate.*": {
      "enable": false
    },
    "*mlp.shared_expert_gate.*": {
      "enable": false
    },
    "*linear_attn.conv1d*": {
      "enable": false
    },
    "*mixer.conv1d*": {
      "enable": false
    },
    "*output_layer*": {
      "enable": false
    },
    "output.*": {
      "enable": false
    },
    "default": {
      "enable": false
    },
    "*norm*": {
      "enable": false
    },
    "*layernorm*": {
      "enable": false
    },
    "*LayerNorm*": {
      "enable": false
    },
    "*rotary*": {
      "enable": false
    },
    "*bias*": {
      "enable": false
    },
    "lm_head*": {
      "enable": false
    },
    "lm_head.weight_quantizer": {
      "enable": false
    },
    "*visual.blocks.*.mlp.linear_fc1*": {
      "enable": false
    },
    "*visual.blocks.*.mlp.linear_fc2*": {
      "enable": false
    },
    "model.visual.blocks.*.mlp.linear_fc1*": {
      "enable": false
    },
    "model.visual.blocks.*.mlp.linear_fc2*": {
      "enable": false
    }
  },
  "algorithm": null
}