{
  "dropout": 0.1,
  "hidden_dim": 768,
  "intermediate_dim": 2048,
  "max_seq_len": 128,
  "n_head": 12,
  "n_kv_head": 6,
  "n_layer": 12,
  "vocab_size": 1024
}
{
  "dropout": 0.1,
  "hidden_dim": 768,
  "intermediate_dim": 2048,
  "max_seq_len": 128,
  "n_head": 12,
  "n_kv_head": 6,
  "n_layer": 12,
  "vocab_size": 1024
}