from dataclasses import dataclass @dataclass class LlamaConfig: hidden_size: int = 576 num_attention_heads: int = 16 num_key_value_heads: int = 4 num_hidden_layers: int = 30 intermediate_size: int = 1536 hidden_act: str = "silu" rms_norm_eps: float = 1e-5 vocab_size: int = 49152 max_position_embeddings: int = 8192 rope_theta: int = 100000 tie_word_embeddings: bool = False