# mindi-backup/final_model/configuration_mindi.py
# Mindigenous
# Sync latest workspace state: data/scripts updates and archive cleanup
# 5ae3e12
"""
Hugging Face config class for MINDI 1.0 420M.
"""
from transformers import PretrainedConfig
class MindiConfig(PretrainedConfig):
    """Configuration container for the MINDI 1.0 420M model.

    Every constructor argument is stored unchanged as an instance attribute
    of the same name. The three special-token ids and any extra keyword
    arguments are forwarded to ``PretrainedConfig.__init__``.

    The code that consumes these values is not part of this file, so the
    descriptions below follow the parameter names only.
    # NOTE(review): confirm the per-field meanings against the modeling code.

    Args:
        vocab_size: Presumably the tokenizer vocabulary size.
        max_seq_len: Presumably the maximum supported sequence length.
        d_model: Presumably the width of the hidden representation.
        n_layers: Presumably the number of transformer blocks.
        n_heads: Presumably the number of attention heads.
        d_ff: Presumably the feed-forward inner dimension.
        dropout: Presumably the dropout probability.
        tie_embeddings: Presumably whether input and output embeddings
            share weights.
        init_std: Presumably the standard deviation for weight init.
        rms_norm_eps: Presumably the epsilon used by RMS normalisation.
        bos_token_id: Beginning-of-sequence token id, passed to the base class.
        eos_token_id: End-of-sequence token id, passed to the base class.
        pad_token_id: Padding token id, passed to the base class.
        **kwargs: Any further options accepted by ``PretrainedConfig``.
    """

    model_type = "mindi"

    # Expose the standard Transformers attribute names as aliases of this
    # config's own field names, so generic library code that reads e.g.
    # ``config.hidden_size`` keeps working. Serialized keys are unaffected.
    # NOTE(review): aliases assume the fields carry their conventional
    # meaning — confirm against the modeling code.
    attribute_map = {
        "hidden_size": "d_model",
        "num_hidden_layers": "n_layers",
        "num_attention_heads": "n_heads",
        "max_position_embeddings": "max_seq_len",
    }

    def __init__(
        self,
        vocab_size: int = 50000,
        max_seq_len: int = 2048,
        d_model: int = 1152,
        n_layers: int = 23,
        n_heads: int = 16,
        d_ff: int = 4608,
        dropout: float = 0.1,
        tie_embeddings: bool = True,
        init_std: float = 0.02,
        rms_norm_eps: float = 1e-5,
        bos_token_id: int = 2,
        eos_token_id: int = 3,
        pad_token_id: int = 0,
        **kwargs,
    ) -> None:
        # Base-class initialisation runs first, exactly as in the original,
        # so the special-token ids and extra kwargs are handled by the
        # library before the model-specific fields are assigned.
        super().__init__(
            bos_token_id=bos_token_id,
            eos_token_id=eos_token_id,
            pad_token_id=pad_token_id,
            **kwargs,
        )

        self.vocab_size = vocab_size
        self.max_seq_len = max_seq_len
        self.d_model = d_model
        self.n_layers = n_layers
        self.n_heads = n_heads
        self.d_ff = d_ff
        self.dropout = dropout
        self.tie_embeddings = tie_embeddings
        self.init_std = init_std
        self.rms_norm_eps = rms_norm_eps