TheoLepere committed on
Commit
4121759
1 Parent(s): bbaa80a

Training in progress, epoch 1

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:016e325e0314192719ae1dee3130b643b93fd287441c2e7c915b42f773513824
3
  size 442564533
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25860bf87d55f316d0238782181ffd1e179ee3e91005ea8356af4270bd936fc3
3
  size 442564533
runs/Apr26_09-50-02_6dc7f8a89189/1682502729.5273108/events.out.tfevents.1682502729.6dc7f8a89189.759.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e30c8fab9682dfd784881a5b29f2e5cef9939c24d157172f784b8127a2ecb78c
3
+ size 5861
runs/Apr26_09-50-02_6dc7f8a89189/events.out.tfevents.1682502729.6dc7f8a89189.759.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc66c26a7d628e60b0473948fdd52aa27a8580a932a5249d07baf3346d68fe9e
3
+ size 4456
special_tokens_map.json CHANGED
@@ -1,7 +1,19 @@
1
  {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "content": "<mask>",
11
+ "lstrip": true,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<pad>",
17
+ "sep_token": "</s>",
18
+ "unk_token": "<unk>"
19
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,13 +1,23 @@
1
  {
 
 
 
 
 
2
  "clean_up_tokenization_spaces": true,
3
- "cls_token": "[CLS]",
4
- "do_lower_case": false,
5
- "mask_token": "[MASK]",
 
 
 
 
 
 
 
6
  "model_max_length": 512,
7
- "pad_token": "[PAD]",
8
- "sep_token": "[SEP]",
9
- "strip_accents": null,
10
- "tokenize_chinese_chars": true,
11
- "tokenizer_class": "DistilBertTokenizer",
12
- "unk_token": "[UNK]"
13
  }
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
  "clean_up_tokenization_spaces": true,
8
+ "cls_token": "<s>",
9
+ "eos_token": "</s>",
10
+ "mask_token": {
11
+ "__type": "AddedToken",
12
+ "content": "<mask>",
13
+ "lstrip": true,
14
+ "normalized": true,
15
+ "rstrip": false,
16
+ "single_word": false
17
+ },
18
  "model_max_length": 512,
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "tokenizer_class": "CamembertTokenizer",
22
+ "unk_token": "<unk>"
 
 
23
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a9dc36b69ba0a3f46b54f18eb48fbf057cd86af7ceea63a9fbb106102aeb6ba
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f430a9f7dc7f5b06bc1ff737392504d6e6b38eda177b320c4166e9de727f8fa
3
  size 3579