Crystalcareai committed on
Commit
7aaee95
1 Parent(s): d90f4c5

Update configuration_gemmoe.py

Browse files
Files changed (1)
  1. configuration_gemmoe.py +1 -1
configuration_gemmoe.py CHANGED
@@ -132,7 +132,7 @@ class GemmoeConfig(PretrainedConfig):
132
  attention_dropout=0.0,
133
  num_experts_per_tok=2,
134
  num_local_experts=8,
135
- router_aux_loss_coef=0.01,
136
  output_router_logits=False,
137
  **kwargs,
138
  ):
 
132
  attention_dropout=0.0,
133
  num_experts_per_tok=2,
134
  num_local_experts=8,
135
+ router_aux_loss_coef=0.02,
136
  output_router_logits=False,
137
  **kwargs,
138
  ):