nncf-qat-kd-bert-l-squadv1.1-sl256 / nncf_bert_config_squad_kd.json
Vui Seng Chua
Add content
c65b8ea
{
"input_info": [
{
"sample_size": [1, 256],
"type": "long"
},
{
"sample_size": [1, 256],
"type": "long"
},
{
"sample_size": [1, 256],
"type": "long"
}
],
"compression": [{
"algorithm": "quantization",
"initializer": {
"range": {
"num_init_samples": 32,
"type": "percentile",
"params":
{
"min_percentile": 0.01,
"max_percentile": 99.99
}
},
"batchnorm_adaptation": {
"num_bn_adaptation_samples": 200
}
},
"activations":
{
"mode": "symmetric"
},
"weights":
{
"mode": "symmetric",
"signed": true,
"per_channel": false
}
},
{
"algorithm": "knowledge_distillation",
"type": "softmax",
"temperature": 3
}
]
}