THE-DDLM committed on
Commit
e42ae25
1 Parent(s): 69fe774
Files changed (2) hide show
  1. config.json +3 -3
  2. pytorch_model.bin +2 -2
config.json CHANGED
@@ -12,10 +12,10 @@
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
- "n_embd": 768,
16
- "n_head": 12,
17
  "n_inner": null,
18
- "n_layer": 12,
19
  "n_positions": 1024,
20
  "reorder_and_upcast_attn": false,
21
  "resid_pdrop": 0.1,
 
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
+ "n_embd": 1024,
16
+ "n_head": 16,
17
  "n_inner": null,
18
+ "n_layer": 24,
19
  "n_positions": 1024,
20
  "reorder_and_upcast_attn": false,
21
  "resid_pdrop": 0.1,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:702f4ba25140a87f6803f8498ee26035c7042162527b4820dc22af263e8a1242
3
- size 510394089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a8a830914c0a5e04b7a5752311f5b1f87a1a82332cdb3928d139dc65994bf01
3
+ size 1444562137