{
  "architectures": [
    "ILKTModel"
  ],
  "auto_map": {
    "AutoConfig": "config.ILKTConfig",
    "AutoModel": "model.ILKTModel"
  },
  "backbone_config": {
    "pretrained_model_name_or_path": "microsoft/mdeberta-v3-base",
    "trust_remote_code": true
  },
  "cls_head_config": {
    "dropout": 0.0,
    "n_dense": 0,
    "pool_type": "cls",
    "use_batch_norm": true,
    "use_layer_norm": false
  },
  "cls_heads": [],
  "embedding_head_config": {
    "dropout": 0.0,
    "n_dense": 1,
    "normalize_embeddings": false,
    "pool_type": "cls",
    "use_batch_norm": false,
    "use_layer_norm": false
  },
  "hidden_size": 768,
  "mlm_head_config": {
    "dropout": 0.0,
    "n_dense": 0,
    "use_batch_norm": true,
    "use_layer_norm": false
  },
  "model_type": "ILKT",
  "torch_dtype": "float32",
  "transformers_version": "4.41.2"
}
|