teddy-f-47
committed on
Commit
•
00d7428
1
Parent(s):
22200d0
Update configuration_phi.py
Browse files - configuration_phi.py +4 -4
configuration_phi.py
CHANGED
@@ -21,11 +21,11 @@ class PhiConfig(PretrainedConfig):
|
|
21 |
def __init__(
|
22 |
self,
|
23 |
vocab_size: int = 50295,
|
24 |
-
n_positions: int =
|
25 |
n_embd: int = 1024,
|
26 |
-
n_layer: int =
|
27 |
n_inner: Optional[int] = None,
|
28 |
-
n_head: int =
|
29 |
n_head_kv: Optional[int] = None,
|
30 |
rotary_dim: Optional[int] = 32,
|
31 |
activation_function: Optional[str] = "gelu_new",
|
@@ -41,7 +41,7 @@ class PhiConfig(PretrainedConfig):
|
|
41 |
pad_vocab_size_multiple: int = 64,
|
42 |
**kwargs
|
43 |
) -> None:
|
44 |
-
self.vocab_size =
|
45 |
self.n_positions = n_positions
|
46 |
self.n_embd = n_embd
|
47 |
self.n_layer = n_layer
|
|
|
21 |
def __init__(
|
22 |
self,
|
23 |
vocab_size: int = 50295,
|
24 |
+
n_positions: int = 1024,
|
25 |
n_embd: int = 1024,
|
26 |
+
n_layer: int = 24,
|
27 |
n_inner: Optional[int] = None,
|
28 |
+
n_head: int = 32,
|
29 |
n_head_kv: Optional[int] = None,
|
30 |
rotary_dim: Optional[int] = 32,
|
31 |
activation_function: Optional[str] = "gelu_new",
|
|
|
41 |
pad_vocab_size_multiple: int = 64,
|
42 |
**kwargs
|
43 |
) -> None:
|
44 |
+
self.vocab_size = vocab_size
|
45 |
self.n_positions = n_positions
|
46 |
self.n_embd = n_embd
|
47 |
self.n_layer = n_layer
|