Aleksandra committed on
Commit
1574d5c
1 Parent(s): 73502c1

Training in progress, step 500

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "allegro/herbert-base-cased",
3
+ "architectures": [
4
+ "BertForQuestionAnswering"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 3072,
13
+ "layer_norm_eps": 1e-12,
14
+ "max_position_embeddings": 514,
15
+ "model_type": "bert",
16
+ "num_attention_heads": 12,
17
+ "num_hidden_layers": 12,
18
+ "pad_token_id": 1,
19
+ "position_embedding_type": "absolute",
20
+ "tokenizer_class": "HerbertTokenizerFast",
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.15.0",
23
+ "type_vocab_size": 2,
24
+ "use_cache": true,
25
+ "vocab_size": 50000
26
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d655f411a06fbecbbc71188176642c04f3f18fd7ecbc49c87b3b2537733c562
3
+ size 495498737
runs/Jan20_12-34-32_5ec4d896b877/1642682111.6865454/events.out.tfevents.1642682111.5ec4d896b877.72.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa3a74408ef5bb734cf88311acdad1f508ac0ca87e346c65469f6359bdaf41e7
3
+ size 4779
runs/Jan20_12-34-32_5ec4d896b877/events.out.tfevents.1642682111.5ec4d896b877.72.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:740c61b64e59f29fb1890dae5395240926c8f83dcaaf732fe22ade770190df3d
3
+ size 4034
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": "<mask>"}
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": "<mask>", "sep_token": "</s>", "do_lowercase_and_remove_accent": false, "bos_token": "<s>", "additional_special_tokens": [], "model_max_length": 512, "special_tokens_map_file": "/root/.cache/huggingface/transformers/a77c29d6c21e653166565b0d51ea0a46b918191512e0ae894422060267a0f436.b8e113717eb1828d09e47de853cf49c8fad05ebdce24df2614cd942dc23e2a77", "name_or_path": "allegro/herbert-base-cased", "lang2id": null, "id2lang": null, "tokenizer_class": "HerbertTokenizer"}
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0979f01b6f084176da14399e0f6f7cdb574772c1c1c323ffbdcab13c96841ed4
3
+ size 2991
vocab.json ADDED
The diff for this file is too large to render. See raw diff