cross-sentence-GEC / config.json
kellywong
upload model and tokenizer
67cdd43
{
"architectures": [
"CSGModel"
],
"beam_size": 12,
"ctx_max_seq_len": 1024,
"dropout": 0.2,
"embedding_dim": 500,
"eos_idx": 2,
"hidden_dim": 1024,
"initializer_range": 0.02,
"kernel_size": 3,
"num_aux_encoders": 3,
"num_decoders": 7,
"num_encoders": 7,
"padding_idx": 1,
"source_vocab_size": 30004,
"src_max_seq_len": 1024,
"target_vocab_size": 30004,
"torch_dtype": "float32",
"transformers_version": "4.10.2",
"trg_max_seq_len": 1024
}