teddy-f-47 committed on
Commit
00d7428
1 Parent(s): 22200d0

Update configuration_phi.py

Browse files
Files changed (1) hide show
  1. configuration_phi.py +4 -4
configuration_phi.py CHANGED
@@ -21,11 +21,11 @@ class PhiConfig(PretrainedConfig):
21
  def __init__(
22
  self,
23
  vocab_size: int = 50295,
24
- n_positions: int = 2048,
25
  n_embd: int = 1024,
26
- n_layer: int = 20,
27
  n_inner: Optional[int] = None,
28
- n_head: int = 16,
29
  n_head_kv: Optional[int] = None,
30
  rotary_dim: Optional[int] = 32,
31
  activation_function: Optional[str] = "gelu_new",
@@ -41,7 +41,7 @@ class PhiConfig(PretrainedConfig):
41
  pad_vocab_size_multiple: int = 64,
42
  **kwargs
43
  ) -> None:
44
- self.vocab_size = int(math.ceil(vocab_size / pad_vocab_size_multiple) * pad_vocab_size_multiple)
45
  self.n_positions = n_positions
46
  self.n_embd = n_embd
47
  self.n_layer = n_layer
 
21
  def __init__(
22
  self,
23
  vocab_size: int = 50295,
24
+ n_positions: int = 1024,
25
  n_embd: int = 1024,
26
+ n_layer: int = 24,
27
  n_inner: Optional[int] = None,
28
+ n_head: int = 32,
29
  n_head_kv: Optional[int] = None,
30
  rotary_dim: Optional[int] = 32,
31
  activation_function: Optional[str] = "gelu_new",
 
41
  pad_vocab_size_multiple: int = 64,
42
  **kwargs
43
  ) -> None:
44
+ self.vocab_size = vocab_size
45
  self.n_positions = n_positions
46
  self.n_embd = n_embd
47
  self.n_layer = n_layer