Transformers
PyTorch
Chinese
Inference Endpoints
EVA2.0-base / config.json
t1101675's picture
Upload config.json
e2edef0
raw
history blame
306 Bytes
{
  "d_model": 768,
  "d_ff": 3072,
  "d_kv": 64,
  "num_heads": 12,
  "num_layers": 12,
  "num_decoder_layers": 12,
  "dropout_rate": 0.0,
  "init_method_std": 0.001,
  "initializer_factor": 1.0,
  "layer_norm_epsilon": 1e-06,
  "max_position_embeddings": 512,
  "use_cache": false,
  "attn_scale": true
}