Crystalcareai
committed on
Commit
•
7aaee95
1
Parent(s):
d90f4c5
Update configuration_gemmoe.py
Browse files
- configuration_gemmoe.py +1 -1
configuration_gemmoe.py
CHANGED
@@ -132,7 +132,7 @@ class GemmoeConfig(PretrainedConfig):
|
|
132 |
attention_dropout=0.0,
|
133 |
num_experts_per_tok=2,
|
134 |
num_local_experts=8,
|
135 |
-
router_aux_loss_coef=0.
|
136 |
output_router_logits=False,
|
137 |
**kwargs,
|
138 |
):
|
|
|
132 |
attention_dropout=0.0,
|
133 |
num_experts_per_tok=2,
|
134 |
num_local_experts=8,
|
135 |
+
router_aux_loss_coef=0.02,
|
136 |
output_router_logits=False,
|
137 |
**kwargs,
|
138 |
):
|