Aunsiels committed on
Commit
4301c48
1 Parent(s): 213757c

Upload 10 files

Browse files
added_tokens.json CHANGED
@@ -1 +1 @@
1
- {"<BOS>": 28996, "<SEP>": 28998, "<PAD>": 28999, "<EOS>": 28997}
1
+ {"<BOS>": 28996, "<EOS>": 28997, "<SEP>": 28998, "<PAD>": 28999}
eval_results_mlm.txt CHANGED
@@ -1 +1 @@
1
- perplexity = 47.5140214816094
1
+ perplexity = 12.60146402572349
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2fbf5dab4a15412f879cef823c7c4640ff99951eadbf6f65cfd3e3376e18a82
3
- size 1334625493
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ecdd9b300ca2ba4ce5c93d4f500b9a58e8121a5501ba44d1ef1aef7ef3a4c16
3
+ size 1334625499
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<BOS>", "eos_token": "<EOS>", "unk_token": "[UNK]", "sep_token": "<SEP>", "pad_token": "<PAD>", "cls_token": "[CLS]", "mask_token": "[MASK]"}
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "bert-large-cased"}
1
+ {"do_lower_case": false, "do_basic_tokenize": true, "never_split": null, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "bert-large-cased", "tokenizer_class": "BertTokenizer"}
train_results.txt CHANGED
@@ -1,11 +1,11 @@
1
- epoch = 10.0
2
- init_mem_cpu_alloc_delta = 1168576512
3
- init_mem_cpu_peaked_delta = 1323925504
4
  init_mem_gpu_alloc_delta = 1335215616
5
  init_mem_gpu_peaked_delta = 0
6
- train_mem_cpu_alloc_delta = 54071296
7
- train_mem_cpu_peaked_delta = 356077568
8
  train_mem_gpu_alloc_delta = 4003456000
9
  train_mem_gpu_peaked_delta = 19106743296
10
- train_runtime = 980.3735
11
- train_samples_per_second = 0.785
1
+ epoch = 1.0
2
+ init_mem_cpu_alloc_delta = 1168203776
3
+ init_mem_cpu_peaked_delta = 1324277760
4
  init_mem_gpu_alloc_delta = 1335215616
5
  init_mem_gpu_peaked_delta = 0
6
+ train_mem_cpu_alloc_delta = 31993856
7
+ train_mem_cpu_peaked_delta = 0
8
  train_mem_gpu_alloc_delta = 4003456000
9
  train_mem_gpu_peaked_delta = 19106743296
10
+ train_runtime = 81.7708
11
+ train_samples_per_second = 0.942
trainer_state.json CHANGED
@@ -1,29 +1,23 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
- "global_step": 770,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 6.49,
12
- "learning_rate": 3.506493506493507e-08,
13
- "loss": 4.2363,
14
- "step": 500
15
- },
16
- {
17
- "epoch": 10.0,
18
- "step": 770,
19
- "total_flos": 6282413018234880.0,
20
- "train_runtime": 980.3735,
21
- "train_samples_per_second": 0.785
22
  }
23
  ],
24
- "max_steps": 770,
25
- "num_train_epochs": 10,
26
- "total_flos": 6282413018234880.0,
27
  "trial_name": null,
28
  "trial_params": null
29
  }
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0,
5
+ "global_step": 77,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 1.0,
12
+ "step": 77,
13
+ "total_flos": 628241301823488.0,
14
+ "train_runtime": 81.7708,
15
+ "train_samples_per_second": 0.942
 
 
 
 
 
 
16
  }
17
  ],
18
+ "max_steps": 77,
19
+ "num_train_epochs": 1,
20
+ "total_flos": 628241301823488.0,
21
  "trial_name": null,
22
  "trial_params": null
23
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4d1f848dbe017c8469705d9ef92d62e3ed52b8479d6f13ba39a024dac0c5229
3
- size 2415
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3d6af5026a1064f813958e7381618040be16d76b31c206f97f2cc7eb0afdcc1
3
+ size 2351