{
  "device": "cuda",
  "dropout": 0.2,
  "n_blocks": 3,
  "transformer_config": {
    "block_size": 500,
    "dropout": 0.2,
    "n_embd": 388,
    "n_head": 8
  },
  "vocab_size": 8010,
  "xlstm_config": {
    "batch_size": 16,
    "block_size": 500,
    "config_block": "msm",
    "device": "cuda",
    "n_embd": 388
  }
}