domenicrosati committed on
Commit
1e6fdbb
1 Parent(s): 482ab65

Training in progress, step 500

Browse files
config.json CHANGED
@@ -46,7 +46,7 @@
46
  "length_penalty": 2.0,
47
  "max_decoder_position_embeddings": 1024,
48
  "max_encoder_position_embeddings": 16384,
49
- "max_length": 1024,
50
  "min_length": 100,
51
  "model_type": "led",
52
  "no_repeat_ngram_size": 3,
@@ -54,7 +54,7 @@
54
  "num_hidden_layers": 6,
55
  "pad_token_id": 1,
56
  "torch_dtype": "float32",
57
- "transformers_version": "4.26.0",
58
  "use_cache": true,
59
  "vocab_size": 50265
60
  }
 
46
  "length_penalty": 2.0,
47
  "max_decoder_position_embeddings": 1024,
48
  "max_encoder_position_embeddings": 16384,
49
+ "max_length": 1536,
50
  "min_length": 100,
51
  "model_type": "led",
52
  "no_repeat_ngram_size": 3,
 
54
  "num_hidden_layers": 6,
55
  "pad_token_id": 1,
56
  "torch_dtype": "float32",
57
+ "transformers_version": "4.38.1",
58
  "use_cache": true,
59
  "vocab_size": 50265
60
  }
merges.txt CHANGED
@@ -1,4 +1,4 @@
1
- #version: 0.2 - Trained by `huggingface/tokenizers`
2
  Ġ t
3
  Ġ a
4
  h e
 
1
+ #version: 0.2
2
  Ġ t
3
  Ġ a
4
  h e
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4e19c7337a31068978eba7446fe6d2a79cba4879f35d507fbdab6ac02fed3e2
3
+ size 647614116
runs/Mar05_17-11-11_0fc7b813a713/events.out.tfevents.1709658672.0fc7b813a713.13040.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0123420214e8c29edc3ed8d15157bf6ddf0a9cd38e53cbbf27156ee823997de
3
+ size 5450
runs/Mar05_17-18-59_0fc7b813a713/events.out.tfevents.1709659140.0fc7b813a713.15099.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf291a7a3febe4ffc967eddafc14747e98eba634d712ae2777c6756b7022eed8
3
+ size 5450
runs/Mar05_17-26-54_0fc7b813a713/events.out.tfevents.1709659615.0fc7b813a713.17094.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0bc8417fdde40eef01ec7f242c061e2e6645cfc62d5d8bb9737e034164c392e
3
+ size 5450
runs/Mar05_17-32-36_0fc7b813a713/events.out.tfevents.1709659957.0fc7b813a713.18609.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96d6e859b9a4da645b7218aed2ebe1a119d24320213829b9859bec581ce03601
3
+ size 5450
runs/Mar06_10-48-15_4bccddc6ef10/events.out.tfevents.1709722097.4bccddc6ef10.3444.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a904959eb7c73629883df7e98cdba40f71f9396cefd0c00e3280660bdfe2606
3
+ size 5450
runs/Mar06_10-53-47_4bccddc6ef10/events.out.tfevents.1709722428.4bccddc6ef10.5142.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:002d9e33738550c6f656ef580387c5c5a52e2eea36bbfd5b0573b5a4a31cf7ab
3
+ size 5450
runs/Mar06_11-00-28_4bccddc6ef10/events.out.tfevents.1709722829.4bccddc6ef10.6983.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34b0c7bd256521801f012ee2d8f256905f06a704f20ee354f22cea51d2ccf5f6
3
+ size 5660
runs/Mar06_11-17-54_4bccddc6ef10/events.out.tfevents.1709723875.4bccddc6ef10.11365.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21678f46f72b2ab83c9abd34281d56925f87451bf9bb1ce6aa8d503c8b8e6e09
3
+ size 88
runs/Mar06_11-22-45_4bccddc6ef10/events.out.tfevents.1709724166.4bccddc6ef10.12632.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7a111ff8d498bdc134a7bc3f37d826f7bc00eeb3f71045845ae3e492b881173
3
+ size 6134
tokenizer.json CHANGED
@@ -96,6 +96,7 @@
96
  "continuing_subword_prefix": "",
97
  "end_of_word_suffix": "",
98
  "fuse_unk": false,
 
99
  "vocab": {
100
  "<s>": 0,
101
  "<pad>": 1,
 
96
  "continuing_subword_prefix": "",
97
  "end_of_word_suffix": "",
98
  "fuse_unk": false,
99
+ "byte_fallback": false,
100
  "vocab": {
101
  "<s>": 0,
102
  "<pad>": 1,
tokenizer_config.json CHANGED
@@ -1,65 +1,57 @@
1
  {
2
  "add_prefix_space": false,
3
- "bos_token": {
4
- "__type": "AddedToken",
5
- "content": "<s>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false
10
- },
11
- "cls_token": {
12
- "__type": "AddedToken",
13
- "content": "<s>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false
18
- },
19
- "eos_token": {
20
- "__type": "AddedToken",
21
- "content": "</s>",
22
- "lstrip": false,
23
- "normalized": true,
24
- "rstrip": false,
25
- "single_word": false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  },
 
 
 
 
27
  "errors": "replace",
28
- "mask_token": {
29
- "__type": "AddedToken",
30
- "content": "<mask>",
31
- "lstrip": true,
32
- "normalized": true,
33
- "rstrip": false,
34
- "single_word": false
35
- },
36
  "model_max_length": 16384,
37
- "name_or_path": "allenai/led-base-16384",
38
- "pad_token": {
39
- "__type": "AddedToken",
40
- "content": "<pad>",
41
- "lstrip": false,
42
- "normalized": true,
43
- "rstrip": false,
44
- "single_word": false
45
- },
46
- "sep_token": {
47
- "__type": "AddedToken",
48
- "content": "</s>",
49
- "lstrip": false,
50
- "normalized": true,
51
- "rstrip": false,
52
- "single_word": false
53
- },
54
- "special_tokens_map_file": "/home/domenic/projects/def-pmongeon/domenic/models--allenai--led-base-16384/snapshots/38335783885b338d93791936c54bb4be46bebed9/special_tokens_map.json",
55
  "tokenizer_class": "LEDTokenizer",
56
  "trim_offsets": true,
57
- "unk_token": {
58
- "__type": "AddedToken",
59
- "content": "<unk>",
60
- "lstrip": false,
61
- "normalized": true,
62
- "rstrip": false,
63
- "single_word": false
64
- }
65
  }
 
1
  {
2
  "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<pad>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "</s>",
22
+ "lstrip": false,
23
+ "normalized": true,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "<unk>",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "50264": {
37
+ "content": "<mask>",
38
+ "lstrip": true,
39
+ "normalized": true,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
  },
45
+ "bos_token": "<s>",
46
+ "clean_up_tokenization_spaces": true,
47
+ "cls_token": "<s>",
48
+ "eos_token": "</s>",
49
  "errors": "replace",
50
+ "mask_token": "<mask>",
 
 
 
 
 
 
 
51
  "model_max_length": 16384,
52
+ "pad_token": "<pad>",
53
+ "sep_token": "</s>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
54
  "tokenizer_class": "LEDTokenizer",
55
  "trim_offsets": true,
56
+ "unk_token": "<unk>"
 
 
 
 
 
 
 
57
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7ed3c1f15892051c1c3b540c0020e55e55028b1ac8ce9583d8e02371dadd51e
3
- size 3707
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbc9f26db116a8eaa41621fbb35f5921831e00561bedf6141051ae49cf2c5f12
3
+ size 5112