File size: 663 Bytes
afdb7c4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 |
# Importing libraries
from transformers import PretrainedConfig
class GPTConfig(PretrainedConfig):
    """Hyperparameter container for the custom GPT model.

    This is a ``PretrainedConfig`` subclass (not a dataclass): the values
    passed to the constructor are stored as plain instance attributes, and
    everything else is handled by the base class.

    Args:
        block_size: Stored as ``self.block_size`` (default 1024).
            NOTE(review): presumably the maximum context length in tokens;
            confirm against the model code.
        vocab_size: Stored as ``self.vocab_size`` (default 50304).
        n_layer: Stored as ``self.n_layer`` (default 12). Also readable as
            ``num_hidden_layers`` through ``attribute_map``.
        n_head: Stored as ``self.n_head`` (default 12). Also readable as
            ``num_attention_heads`` through ``attribute_map``.
        n_embd: Stored as ``self.n_embd`` (default 768). Also readable as
            ``hidden_size`` through ``attribute_map``.
        **kwargs: Forwarded unchanged to ``PretrainedConfig.__init__``.
    """

    model_type = "custom_gpt"

    # Alias the standard Hugging Face attribute names onto the GPT-style
    # names used here, so generic code that reads ``config.hidden_size`` etc.
    # works with this config. Purely additive: the original names remain the
    # ones that are stored.
    attribute_map = {
        "hidden_size": "n_embd",
        "num_attention_heads": "n_head",
        "num_hidden_layers": "n_layer",
    }

    def __init__(
        self,
        block_size: int = 1024,
        vocab_size: int = 50304,
        n_layer: int = 12,
        n_head: int = 12,
        n_embd: int = 768,
        **kwargs,
    ) -> None:
        """Initialise the base config, then store the GPT hyperparameters."""
        # Base initialisation runs first, exactly as before, so the explicit
        # arguments below always win over anything set from ``kwargs``.
        super().__init__(**kwargs)
        self.block_size = block_size
        self.vocab_size = vocab_size
        self.n_layer = n_layer
        self.n_head = n_head
        self.n_embd = n_embd
|