kasohrab committed on
Commit
a764737
1 Parent(s): e77488d

Training in progress, epoch 1

Browse files
Files changed (31) hide show
  1. .gitignore +1 -0
  2. config.json +30 -0
  3. logs/1714006907.533991/events.out.tfevents.1714006907.persepolis.83624.1 +3 -0
  4. logs/1714007004.458195/events.out.tfevents.1714007004.persepolis.67148.1 +3 -0
  5. logs/1714007123.0655115/events.out.tfevents.1714007123.persepolis.81164.1 +3 -0
  6. logs/1714007706.9180722/events.out.tfevents.1714007706.persepolis.81164.3 +3 -0
  7. logs/1714007874.0225153/events.out.tfevents.1714007874.persepolis.81164.5 +3 -0
  8. logs/1714007994.3851368/events.out.tfevents.1714007994.persepolis.81660.1 +3 -0
  9. logs/1714011006.6806612/events.out.tfevents.1714011006.persepolis.81488.1 +3 -0
  10. logs/1714011229.5143385/events.out.tfevents.1714011229.persepolis.80352.1 +3 -0
  11. logs/1714011861.966598/events.out.tfevents.1714011861.persepolis.80352.4 +3 -0
  12. logs/1714012923.067573/events.out.tfevents.1714012923.persepolis.80352.6 +3 -0
  13. logs/1714017504.8640153/events.out.tfevents.1714017504.persepolis.56460.1 +3 -0
  14. logs/events.out.tfevents.1714006907.persepolis.83624.0 +3 -0
  15. logs/events.out.tfevents.1714007004.persepolis.67148.0 +3 -0
  16. logs/events.out.tfevents.1714007123.persepolis.81164.0 +3 -0
  17. logs/events.out.tfevents.1714007706.persepolis.81164.2 +3 -0
  18. logs/events.out.tfevents.1714007874.persepolis.81164.4 +3 -0
  19. logs/events.out.tfevents.1714007994.persepolis.81660.0 +3 -0
  20. logs/events.out.tfevents.1714011006.persepolis.81488.0 +3 -0
  21. logs/events.out.tfevents.1714011229.persepolis.80352.0 +3 -0
  22. logs/events.out.tfevents.1714011795.persepolis.80352.2 +3 -0
  23. logs/events.out.tfevents.1714011861.persepolis.80352.3 +3 -0
  24. logs/events.out.tfevents.1714012923.persepolis.80352.5 +3 -0
  25. logs/events.out.tfevents.1714017504.persepolis.56460.0 +3 -0
  26. pytorch_model.bin +3 -0
  27. special_tokens_map.json +7 -0
  28. tokenizer.json +0 -0
  29. tokenizer_config.json +15 -0
  30. training_args.bin +3 -0
  31. vocab.txt +0 -0
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/electra-small-discriminator",
3
+ "architectures": [
4
+ "ElectraForQuestionAnswering"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "embedding_size": 128,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 256,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 1024,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "electra",
17
+ "num_attention_heads": 4,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "position_embedding_type": "absolute",
21
+ "summary_activation": "gelu",
22
+ "summary_last_dropout": 0.1,
23
+ "summary_type": "first",
24
+ "summary_use_proj": true,
25
+ "torch_dtype": "float32",
26
+ "transformers_version": "4.28.1",
27
+ "type_vocab_size": 2,
28
+ "use_cache": true,
29
+ "vocab_size": 30522
30
+ }
logs/1714006907.533991/events.out.tfevents.1714006907.persepolis.83624.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6670812c0c81c31ff945f89d10da028709ee4bbeac91445f93ca150e03ccb4ff
3
+ size 5901
logs/1714007004.458195/events.out.tfevents.1714007004.persepolis.67148.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae0d31aa959e5cc2fbb764f8a07dbaafa0f141541035d39a6b7cb03c435e45fe
3
+ size 5901
logs/1714007123.0655115/events.out.tfevents.1714007123.persepolis.81164.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d877577758e972c4279523d6ab50ae2e4978e54a870691653809adec49df1e1
3
+ size 5901
logs/1714007706.9180722/events.out.tfevents.1714007706.persepolis.81164.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10708555025451ef7b939c558c6da286fd21be1cf95bafd391af029388a79bae
3
+ size 5901
logs/1714007874.0225153/events.out.tfevents.1714007874.persepolis.81164.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00eb32aa0b61070893a343b59b737adc35655e0b3d1db0adb17c84180112f63f
3
+ size 5901
logs/1714007994.3851368/events.out.tfevents.1714007994.persepolis.81660.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad2573405cb76ebd1633cc3f333566ed8bfa3f840c66728e94c7753e07a8545
3
+ size 5901
logs/1714011006.6806612/events.out.tfevents.1714011006.persepolis.81488.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:befaa8f8a0022a0d691ffdf7e0be591746c764392de8d0524bcc17e854e0c6be
3
+ size 5901
logs/1714011229.5143385/events.out.tfevents.1714011229.persepolis.80352.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b0a9501e819d48a98663b8776045d2bc31ce3562dc3dec80d2aa4c8e75e58b5
3
+ size 5901
logs/1714011861.966598/events.out.tfevents.1714011861.persepolis.80352.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4217720b431c5ce4a1c49cdf5f05b9908567770d9ae625d6eda73fc107b8488
3
+ size 5898
logs/1714012923.067573/events.out.tfevents.1714012923.persepolis.80352.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6f3a5aced0965d404ba4f50d3fad5fbcc14633ec62405acaaf787af23a7c9da
3
+ size 5891
logs/1714017504.8640153/events.out.tfevents.1714017504.persepolis.56460.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd64dd0c7800d63f5efe00e9652eec65f7e895c61f53b6bb5ddc1ed6dc42e771
3
+ size 5888
logs/events.out.tfevents.1714006907.persepolis.83624.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b00b94baddb977e91949de6389a110dc29ccda2fe162e952baef42d5c00160f6
3
+ size 4165
logs/events.out.tfevents.1714007004.persepolis.67148.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d523a5cad3012f2d6f9531629e0f9e720313329e15d3a909f405bec888aaa573
3
+ size 4165
logs/events.out.tfevents.1714007123.persepolis.81164.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64e294c0a5553eee7f1730261d651c3b38a10a78876b281a458f6f7cd1b95d8e
3
+ size 4144
logs/events.out.tfevents.1714007706.persepolis.81164.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02cf61789679c58d441f20b613fc95a11178df033ed08115d7025c2db8912325
3
+ size 4144
logs/events.out.tfevents.1714007874.persepolis.81164.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1a4fd386976f7c1c2b8e2a1a953d6e3a24be07d8b4f0e84dca7a438fe444821
3
+ size 4144
logs/events.out.tfevents.1714007994.persepolis.81660.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:033236c388713db561f079a0db52788a0ed8f3d896d6916b8a9aa6af08e62949
3
+ size 4144
logs/events.out.tfevents.1714011006.persepolis.81488.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0888f5ba1db01391c7553d9be0d4d6fe10fae33678c7bfc10dcf737f384f41d
3
+ size 4144
logs/events.out.tfevents.1714011229.persepolis.80352.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58912f7fbec944059ad36bbb96240dd4475b8ee85804f8432b48968017e240dd
3
+ size 4298
logs/events.out.tfevents.1714011795.persepolis.80352.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d96fed7ce9517d20194aaa80ed24b1d990db3482c7077bb209e925a819d7ad3a
3
+ size 88
logs/events.out.tfevents.1714011861.persepolis.80352.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:465233e4d8684256b05bff0d798b93af53d4fa8e16f2282bdca21b04b5711773
3
+ size 4295
logs/events.out.tfevents.1714012923.persepolis.80352.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69dfae8e915615a73a9b8fcb574667dc781f3672ecfc3a39a29e6369e2f6543b
3
+ size 4296
logs/events.out.tfevents.1714017504.persepolis.56460.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73f17e93f0b35621dab340e411b01eed192d4b6f300a1c862705344234803c9d
3
+ size 4294
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1933674f0d2bc165ab6c0dba9c3cc49377f922321132b44a05f1589fbf0503e
3
+ size 54007922
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "clean_up_tokenization_spaces": true,
3
+ "cls_token": "[CLS]",
4
+ "do_basic_tokenize": true,
5
+ "do_lower_case": true,
6
+ "mask_token": "[MASK]",
7
+ "model_max_length": 512,
8
+ "never_split": null,
9
+ "pad_token": "[PAD]",
10
+ "sep_token": "[SEP]",
11
+ "strip_accents": null,
12
+ "tokenize_chinese_chars": true,
13
+ "tokenizer_class": "ElectraTokenizer",
14
+ "unk_token": "[UNK]"
15
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f19cdee513c9952f3a4fa8e73b256db061c2cc17a7fdaddaa48320883157d09
3
+ size 4280
vocab.txt ADDED
The diff for this file is too large to render. See raw diff