stefan-it committed on
Commit
ac0836f
1 Parent(s): 11abdb3

model: add new checkpoint for GC4 ELECTRA model

Browse files
.gitattributes CHANGED
@@ -14,3 +14,6 @@
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
 
 
 
 
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
17
+ *.meta filter=lfs diff=lfs merge=lfs -text
18
+ *.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
19
+ *.index filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "electra-base-gc4-64k-800000-cased-generator",
3
+ "architectures": [
4
+ "ElectraForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "embedding_size": 768,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 256,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 1024,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "electra",
16
+ "num_attention_heads": 4,
17
+ "num_hidden_layers": 12,
18
+ "pad_token_id": 0,
19
+ "position_embedding_type": "absolute",
20
+ "summary_activation": "gelu",
21
+ "summary_last_dropout": 0.1,
22
+ "summary_type": "first",
23
+ "summary_use_proj": true,
24
+ "transformers_version": "4.6.0.dev0",
25
+ "type_vocab_size": 2,
26
+ "vocab_size": 64000
27
+ }
model.ckpt-800000.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0554a1121aa2a71953fc493e45e29fb51808f64a45d1079372952ac560b81111
3
+ size 1741572116
model.ckpt-800000.index ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:939c6540c047f3fb84263643b75a1a4ee2d8e6dc854981d88eadc0d9c7a54619
3
+ size 18022
model.ckpt-800000.meta ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d679f9acd303c3a0c4cd127d4227c99c6360be4e775034e2e128a4ed507f336
3
+ size 9227280
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11d137f4e358848794da5d48e9b7a6cabade8fbd190eb61a9043b09a80713188
3
+ size 238029732
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d11e3a166357c309b90f22b612c5051beba32c0938e44ad5cd4aff6967d22d5
3
+ size 436414984