Training in progress, epoch 1
Browse files- .gitignore +1 -0
- config.json +30 -0
- logs/1714006907.533991/events.out.tfevents.1714006907.persepolis.83624.1 +3 -0
- logs/1714007004.458195/events.out.tfevents.1714007004.persepolis.67148.1 +3 -0
- logs/1714007123.0655115/events.out.tfevents.1714007123.persepolis.81164.1 +3 -0
- logs/1714007706.9180722/events.out.tfevents.1714007706.persepolis.81164.3 +3 -0
- logs/1714007874.0225153/events.out.tfevents.1714007874.persepolis.81164.5 +3 -0
- logs/1714007994.3851368/events.out.tfevents.1714007994.persepolis.81660.1 +3 -0
- logs/1714011006.6806612/events.out.tfevents.1714011006.persepolis.81488.1 +3 -0
- logs/1714011229.5143385/events.out.tfevents.1714011229.persepolis.80352.1 +3 -0
- logs/1714011861.966598/events.out.tfevents.1714011861.persepolis.80352.4 +3 -0
- logs/1714012923.067573/events.out.tfevents.1714012923.persepolis.80352.6 +3 -0
- logs/1714017504.8640153/events.out.tfevents.1714017504.persepolis.56460.1 +3 -0
- logs/events.out.tfevents.1714006907.persepolis.83624.0 +3 -0
- logs/events.out.tfevents.1714007004.persepolis.67148.0 +3 -0
- logs/events.out.tfevents.1714007123.persepolis.81164.0 +3 -0
- logs/events.out.tfevents.1714007706.persepolis.81164.2 +3 -0
- logs/events.out.tfevents.1714007874.persepolis.81164.4 +3 -0
- logs/events.out.tfevents.1714007994.persepolis.81660.0 +3 -0
- logs/events.out.tfevents.1714011006.persepolis.81488.0 +3 -0
- logs/events.out.tfevents.1714011229.persepolis.80352.0 +3 -0
- logs/events.out.tfevents.1714011795.persepolis.80352.2 +3 -0
- logs/events.out.tfevents.1714011861.persepolis.80352.3 +3 -0
- logs/events.out.tfevents.1714012923.persepolis.80352.5 +3 -0
- logs/events.out.tfevents.1714017504.persepolis.56460.0 +3 -0
- pytorch_model.bin +3 -0
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +15 -0
- training_args.bin +3 -0
- vocab.txt +0 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "google/electra-small-discriminator",
|
3 |
+
"architectures": [
|
4 |
+
"ElectraForQuestionAnswering"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"embedding_size": 128,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 256,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 1024,
|
14 |
+
"layer_norm_eps": 1e-12,
|
15 |
+
"max_position_embeddings": 512,
|
16 |
+
"model_type": "electra",
|
17 |
+
"num_attention_heads": 4,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"position_embedding_type": "absolute",
|
21 |
+
"summary_activation": "gelu",
|
22 |
+
"summary_last_dropout": 0.1,
|
23 |
+
"summary_type": "first",
|
24 |
+
"summary_use_proj": true,
|
25 |
+
"torch_dtype": "float32",
|
26 |
+
"transformers_version": "4.28.1",
|
27 |
+
"type_vocab_size": 2,
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 30522
|
30 |
+
}
|
logs/1714006907.533991/events.out.tfevents.1714006907.persepolis.83624.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6670812c0c81c31ff945f89d10da028709ee4bbeac91445f93ca150e03ccb4ff
|
3 |
+
size 5901
|
logs/1714007004.458195/events.out.tfevents.1714007004.persepolis.67148.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae0d31aa959e5cc2fbb764f8a07dbaafa0f141541035d39a6b7cb03c435e45fe
|
3 |
+
size 5901
|
logs/1714007123.0655115/events.out.tfevents.1714007123.persepolis.81164.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d877577758e972c4279523d6ab50ae2e4978e54a870691653809adec49df1e1
|
3 |
+
size 5901
|
logs/1714007706.9180722/events.out.tfevents.1714007706.persepolis.81164.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10708555025451ef7b939c558c6da286fd21be1cf95bafd391af029388a79bae
|
3 |
+
size 5901
|
logs/1714007874.0225153/events.out.tfevents.1714007874.persepolis.81164.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00eb32aa0b61070893a343b59b737adc35655e0b3d1db0adb17c84180112f63f
|
3 |
+
size 5901
|
logs/1714007994.3851368/events.out.tfevents.1714007994.persepolis.81660.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fad2573405cb76ebd1633cc3f333566ed8bfa3f840c66728e94c7753e07a8545
|
3 |
+
size 5901
|
logs/1714011006.6806612/events.out.tfevents.1714011006.persepolis.81488.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:befaa8f8a0022a0d691ffdf7e0be591746c764392de8d0524bcc17e854e0c6be
|
3 |
+
size 5901
|
logs/1714011229.5143385/events.out.tfevents.1714011229.persepolis.80352.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b0a9501e819d48a98663b8776045d2bc31ce3562dc3dec80d2aa4c8e75e58b5
|
3 |
+
size 5901
|
logs/1714011861.966598/events.out.tfevents.1714011861.persepolis.80352.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4217720b431c5ce4a1c49cdf5f05b9908567770d9ae625d6eda73fc107b8488
|
3 |
+
size 5898
|
logs/1714012923.067573/events.out.tfevents.1714012923.persepolis.80352.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6f3a5aced0965d404ba4f50d3fad5fbcc14633ec62405acaaf787af23a7c9da
|
3 |
+
size 5891
|
logs/1714017504.8640153/events.out.tfevents.1714017504.persepolis.56460.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd64dd0c7800d63f5efe00e9652eec65f7e895c61f53b6bb5ddc1ed6dc42e771
|
3 |
+
size 5888
|
logs/events.out.tfevents.1714006907.persepolis.83624.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b00b94baddb977e91949de6389a110dc29ccda2fe162e952baef42d5c00160f6
|
3 |
+
size 4165
|
logs/events.out.tfevents.1714007004.persepolis.67148.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d523a5cad3012f2d6f9531629e0f9e720313329e15d3a909f405bec888aaa573
|
3 |
+
size 4165
|
logs/events.out.tfevents.1714007123.persepolis.81164.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64e294c0a5553eee7f1730261d651c3b38a10a78876b281a458f6f7cd1b95d8e
|
3 |
+
size 4144
|
logs/events.out.tfevents.1714007706.persepolis.81164.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02cf61789679c58d441f20b613fc95a11178df033ed08115d7025c2db8912325
|
3 |
+
size 4144
|
logs/events.out.tfevents.1714007874.persepolis.81164.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1a4fd386976f7c1c2b8e2a1a953d6e3a24be07d8b4f0e84dca7a438fe444821
|
3 |
+
size 4144
|
logs/events.out.tfevents.1714007994.persepolis.81660.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:033236c388713db561f079a0db52788a0ed8f3d896d6916b8a9aa6af08e62949
|
3 |
+
size 4144
|
logs/events.out.tfevents.1714011006.persepolis.81488.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0888f5ba1db01391c7553d9be0d4d6fe10fae33678c7bfc10dcf737f384f41d
|
3 |
+
size 4144
|
logs/events.out.tfevents.1714011229.persepolis.80352.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58912f7fbec944059ad36bbb96240dd4475b8ee85804f8432b48968017e240dd
|
3 |
+
size 4298
|
logs/events.out.tfevents.1714011795.persepolis.80352.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d96fed7ce9517d20194aaa80ed24b1d990db3482c7077bb209e925a819d7ad3a
|
3 |
+
size 88
|
logs/events.out.tfevents.1714011861.persepolis.80352.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:465233e4d8684256b05bff0d798b93af53d4fa8e16f2282bdca21b04b5711773
|
3 |
+
size 4295
|
logs/events.out.tfevents.1714012923.persepolis.80352.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69dfae8e915615a73a9b8fcb574667dc781f3672ecfc3a39a29e6369e2f6543b
|
3 |
+
size 4296
|
logs/events.out.tfevents.1714017504.persepolis.56460.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73f17e93f0b35621dab340e411b01eed192d4b6f300a1c862705344234803c9d
|
3 |
+
size 4294
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1933674f0d2bc165ab6c0dba9c3cc49377f922321132b44a05f1589fbf0503e
|
3 |
+
size 54007922
|
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"clean_up_tokenization_spaces": true,
|
3 |
+
"cls_token": "[CLS]",
|
4 |
+
"do_basic_tokenize": true,
|
5 |
+
"do_lower_case": true,
|
6 |
+
"mask_token": "[MASK]",
|
7 |
+
"model_max_length": 512,
|
8 |
+
"never_split": null,
|
9 |
+
"pad_token": "[PAD]",
|
10 |
+
"sep_token": "[SEP]",
|
11 |
+
"strip_accents": null,
|
12 |
+
"tokenize_chinese_chars": true,
|
13 |
+
"tokenizer_class": "ElectraTokenizer",
|
14 |
+
"unk_token": "[UNK]"
|
15 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f19cdee513c9952f3a4fa8e73b256db061c2cc17a7fdaddaa48320883157d09
|
3 |
+
size 4280
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|