Fill-Mask
PyTorch
TensorFlow
JAX
Transformers
multilingual
af
am
ar
as
az
be
bg
bn
br
bs
ca
cs
cy
da
de
el
en
eo
es
et
eu
fa
fi
fr
fy
ga
gd
gl
gu
ha
he
hi
hr
hu
hy
id
is
it
ja
jv
ka
kk
km
kn
ko
ku
ky
la
lo
lt
lv
mg
mk
ml
mn
mr
ms
my
ne
nl
no
om
or
pa
pl
ps
pt
ro
ru
sa
sd
si
sk
sl
so
sq
sr
su
sv
sw
ta
te
th
tl
tr
ug
uk
ur
uz
vi
xh
yi
zh
mit
xlm-roberta
exbert
AutoTrain Compatible
add flax model
Browse files
- .ipynb_checkpoints/config-checkpoint.json +25 -0
- config.json +3 -0
- flax_model.msgpack +3 -0
.ipynb_checkpoints/config-checkpoint.json
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"XLMRobertaForMaskedLM"
|
4 |
+
],
|
5 |
+
"attention_probs_dropout_prob": 0.1,
|
6 |
+
"bos_token_id": 0,
|
7 |
+
"eos_token_id": 2,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 768,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 3072,
|
13 |
+
"layer_norm_eps": 1e-05,
|
14 |
+
"max_position_embeddings": 514,
|
15 |
+
"model_type": "xlm-roberta",
|
16 |
+
"num_attention_heads": 12,
|
17 |
+
"num_hidden_layers": 12,
|
18 |
+
"output_past": true,
|
19 |
+
"pad_token_id": 1,
|
20 |
+
"position_embedding_type": "absolute",
|
21 |
+
"transformers_version": "4.17.0.dev0",
|
22 |
+
"type_vocab_size": 1,
|
23 |
+
"use_cache": true,
|
24 |
+
"vocab_size": 250002
|
25 |
+
}
|
config.json
CHANGED
@@ -17,6 +17,9 @@
|
|
17 |
"num_hidden_layers": 12,
|
18 |
"output_past": true,
|
19 |
"pad_token_id": 1,
|
|
|
|
|
20 |
"type_vocab_size": 1,
|
|
|
21 |
"vocab_size": 250002
|
22 |
}
|
17 |
"num_hidden_layers": 12,
|
18 |
"output_past": true,
|
19 |
"pad_token_id": 1,
|
20 |
+
"position_embedding_type": "absolute",
|
21 |
+
"transformers_version": "4.17.0.dev0",
|
22 |
"type_vocab_size": 1,
|
23 |
+
"use_cache": true,
|
24 |
"vocab_size": 250002
|
25 |
}
|
flax_model.msgpack
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:311b6941e02128b01c6a429f55b47b351a86fe53e6802774d87696bcbc465992
|
3 |
+
size 1113187999
|