stefan-it committed on
Commit
5d0d7d4
1 Parent(s): 5218064

model: add new checkpoint for GC4 ELECTRA model

Browse files
.gitattributes CHANGED
@@ -14,3 +14,6 @@
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
 
 
 
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
17
+ *.meta filter=lfs diff=lfs merge=lfs -text
18
+ *.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
19
+ *.index filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "electra-base-gc4-64k-200000-cased-generator",
3
+ "architectures": [
4
+ "ElectraForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "embedding_size": 768,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 256,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 1024,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "electra",
16
+ "num_attention_heads": 4,
17
+ "num_hidden_layers": 12,
18
+ "pad_token_id": 0,
19
+ "position_embedding_type": "absolute",
20
+ "summary_activation": "gelu",
21
+ "summary_last_dropout": 0.1,
22
+ "summary_type": "first",
23
+ "summary_use_proj": true,
24
+ "transformers_version": "4.6.0.dev0",
25
+ "type_vocab_size": 2,
26
+ "vocab_size": 64000
27
+ }
model.ckpt-200000.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22db1d3eb67df00e37970237e02b3119aa4f04a9f68118399a4c49002102c8df
3
+ size 1741572116
model.ckpt-200000.index ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:887fa02d08707b069df405554cea9d4d5d31d1881ca98512f619965d9e150ac7
3
+ size 18023
model.ckpt-200000.meta ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba9cc364662a6c6089d315a3f08b494070e217351da9afd3202f657010f8fc8b
3
+ size 9227280
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00c1d062a2065cb0a113756d8a8b2fec42a97f76cd5258ce84eece9b6a4487e6
3
+ size 238029732
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02d0b182be441afdf6ec0e0fc4e511739c85a0ef0a6d67a44b9ca19abf2b99f7
3
+ size 436414984