lvwerra (HF staff) committed
Commit c12d373
Parent(s): 2c4c5b3

fix config.json

Files changed (1): config.json (+4 -4)
config.json CHANGED
@@ -5,10 +5,10 @@
     "GPT2LMHeadModel"
   ],
   "attn_pdrop": 0.1,
-  "bos_token_id": 50256,
+  "bos_token_id": 0,
   "embd_pdrop": 0.1,
-  "eos_token_id": 50256,
-  "gradient_checkpointing": true,
+  "eos_token_id": 0,
+  "gradient_checkpointing": false,
   "initializer_range": 0.02,
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
@@ -21,7 +21,7 @@
   "output_past": true,
   "reorder_and_upcast_attn": true,
   "resid_pdrop": 0.1,
-  "scale_attn_by_layer_idx": true,
+  "scale_attn_by_inverse_layer_idx": true,
   "scale_attn_weights": true,
   "summary_activation": null,
   "summary_first_dropout": 0.1,