stefan-it committed on
Commit
b82bad4
1 Parent(s): 11e3f1d

model: add new checkpoint for GC4 ELECTRA model

Browse files
.gitattributes CHANGED
@@ -14,3 +14,6 @@
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
 
 
 
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
17
+ *.meta filter=lfs diff=lfs merge=lfs -text
18
+ *.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
19
+ *.index filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "electra-base-gc4-64k-900000-cased-generator",
3
+ "architectures": [
4
+ "ElectraForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "embedding_size": 768,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 256,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 1024,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "electra",
16
+ "num_attention_heads": 4,
17
+ "num_hidden_layers": 12,
18
+ "pad_token_id": 0,
19
+ "position_embedding_type": "absolute",
20
+ "summary_activation": "gelu",
21
+ "summary_last_dropout": 0.1,
22
+ "summary_type": "first",
23
+ "summary_use_proj": true,
24
+ "transformers_version": "4.6.0.dev0",
25
+ "type_vocab_size": 2,
26
+ "vocab_size": 64000
27
+ }
model.ckpt-900000.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d66b2743df1ab92ef3e5e93f6169024db2ef9644ab661bf879e969c717ca1734
3
+ size 1741572116
model.ckpt-900000.index ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2305a84c64adb99e6a9644950866881acb49a553f84a38db2a8beebd02f90696
3
+ size 18011
model.ckpt-900000.meta ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5da12b945e1573443949a5cd16db1ea7df1ce5c158e7252699bd06bff6a7848
3
+ size 9227280
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e12784acb0bda1c17baf2ac74776a087d286614b8964e237883f1d4f32890b81
3
+ size 238029732
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7d897a9dc75b5a7230d9846db98468eefbe52d8218ef12433f9902f5a39e55c
3
+ size 436414984