AbhayGoyal committed on
Commit
51752e7
1 Parent(s): 5e46c09

Training in progress, epoch 0

Browse files
Files changed (3) hide show
  1. config.json +1 -0
  2. pytorch_model.bin +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -14,6 +14,7 @@
14
  "model_type": "mixformer-sequential",
15
  "n_embd": 2048,
16
  "n_head": 32,
 
17
  "n_inner": null,
18
  "n_layer": 24,
19
  "n_positions": 2048,
 
14
  "model_type": "mixformer-sequential",
15
  "n_embd": 2048,
16
  "n_head": 32,
17
+ "n_head_kv": null,
18
  "n_inner": null,
19
  "n_layer": 24,
20
  "n_positions": 2048,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43a4a63f2d435a0442a4de1635743b6d9332b5fb66fc028c24ba059d54cd41a5
3
- size 5692078714
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b17c2dc43deda0b407d6494fd994f12acf9c29b32466494d19ee5740f5625b2b
3
+ size 5695215210
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:331348691d625372752ef9ea6ab27f1940db55643f38fbe6027a3bc08f201222
3
  size 4472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72d6946800a28ae52e747ce56e34f1c5efbfecdfc18316f18be057886367be3f
3
  size 4472