stefan-it committed on
Commit
d16f10c
1 Parent(s): ab62d88

model: add new checkpoint for GC4 ELECTRA model

Browse files
.gitattributes CHANGED
@@ -14,3 +14,6 @@
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
 
 
 
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
17
+ *.meta filter=lfs diff=lfs merge=lfs -text
18
+ *.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
19
+ *.index filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "electra-base-gc4-64k-800000-cased-discriminator",
3
+ "architectures": [
4
+ "ElectraForPreTraining"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "embedding_size": 768,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 3072,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "electra",
16
+ "num_attention_heads": 12,
17
+ "num_hidden_layers": 12,
18
+ "pad_token_id": 0,
19
+ "position_embedding_type": "absolute",
20
+ "summary_activation": "gelu",
21
+ "summary_last_dropout": 0.1,
22
+ "summary_type": "first",
23
+ "summary_use_proj": true,
24
+ "transformers_version": "4.6.0.dev0",
25
+ "type_vocab_size": 2,
26
+ "vocab_size": 64000
27
+ }
model.ckpt-800000.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0554a1121aa2a71953fc493e45e29fb51808f64a45d1079372952ac560b81111
3
+ size 1741572116
model.ckpt-800000.index ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:939c6540c047f3fb84263643b75a1a4ee2d8e6dc854981d88eadc0d9c7a54619
3
+ size 18022
model.ckpt-800000.meta ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d679f9acd303c3a0c4cd127d4227c99c6360be4e775034e2e128a4ed507f336
3
+ size 9227280
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41fdeab249f133e13bcc2af4cfef42303d8911abb25db010d840e3070200a1ff
3
+ size 540864329
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6758bbc73762735176b8a359c1e4a582b7247c3e7025f992136799d0e17de25
3
+ size 541048720