RITA_xl / config.json
DanielHesslow's picture
Update config.json
40473fe
raw
history blame contribute delete
656 Bytes
{
"_name_or_path": "Seledorn/RITA_xl",
"architectures": [
"RITAModelForCausalLM"
],
"auto_map": {
"AutoConfig": "rita_configuration.RITAConfig",
"AutoModel": "rita_modeling.RITAModel",
"AutoModelForCausalLM": "rita_modeling.RITAModelForCausalLM",
"AutoModelForSequenceClassification": "rita_modeling.RITAModelForSequenceClassification"
},
"d_feedforward": 8192,
"d_model": 2048,
"dropout": 0.0,
"eos_token_id": 2,
"initializer_range": 0.02,
"max_seq_len": 1024,
"model_type": "rita",
"num_heads": 32,
"num_layers": 24,
"torch_dtype": "float16",
"transformers_version": "4.18.0",
"vocab_size": 26
}