keyfan committed on
Commit
a556a8d
1 Parent(s): ccee1b3

Fix rope base

Browse files
Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -12,7 +12,7 @@
12
  "bos_token_id": 1,
13
  "embedding_multiplier_scale": 78.38367176906169,
14
  "eos_token_id": 2,
15
- "hidden_act": "gelu",
16
  "hidden_size": 6144,
17
  "initializer_range": 0.02,
18
  "intermediate_size": 32768,
@@ -27,7 +27,7 @@
27
  "output_router_logits": false,
28
  "pad_token_id": 0,
29
  "rms_norm_eps": 1e-05,
30
- "rope_theta": 100000.0,
31
  "router_aux_loss_coef": 0.02,
32
  "sliding_window": null,
33
  "torch_dtype": "bfloat16",
 
12
  "bos_token_id": 1,
13
  "embedding_multiplier_scale": 78.38367176906169,
14
  "eos_token_id": 2,
15
+ "hidden_act": "gelu_new",
16
  "hidden_size": 6144,
17
  "initializer_range": 0.02,
18
  "intermediate_size": 32768,
 
27
  "output_router_logits": false,
28
  "pad_token_id": 0,
29
  "rms_norm_eps": 1e-05,
30
+ "rope_theta": 10000.0,
31
  "router_aux_loss_coef": 0.02,
32
  "sliding_window": null,
33
  "torch_dtype": "bfloat16",