kalomaze committed on
Commit
c92c68d
1 Parent(s): c0f6592

add router aux loss coefficient

Browse files
Files changed (1) hide show
  1. config.json +3 -1
config.json CHANGED
@@ -17,9 +17,11 @@
17
  "num_hidden_layers": 32,
18
  "num_key_value_heads": 8,
19
  "num_local_experts": 8,
 
20
  "rms_norm_eps": 1e-05,
21
  "rope_theta": 10000.0,
22
- "sliding_window": 4096,
 
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.41.1",
 
17
  "num_hidden_layers": 32,
18
  "num_key_value_heads": 8,
19
  "num_local_experts": 8,
20
+ "output_router_logits": false,
21
  "rms_norm_eps": 1e-05,
22
  "rope_theta": 10000.0,
23
+ "router_aux_loss_coef": 0.02,
24
+ "sliding_window": null,
25
  "tie_word_embeddings": false,
26
  "torch_dtype": "bfloat16",
27
  "transformers_version": "4.41.1",