obudzecie commited on
Commit
6c7d00a
1 Parent(s): fb831dd

Training in progress, epoch 2

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc03d6730cedf94c065cccb684601215248ed70177281b48f84551c77862f299
3
  size 98725415
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a86f1bda26ad1640354bf6c188d80244a7f5f2b6694b2012f67143f6edbdaed7
3
  size 98725415
run-4/checkpoint-214/config.json CHANGED
@@ -24,7 +24,7 @@
24
  "pad_token_id": 0,
25
  "problem_type": "single_label_classification",
26
  "torch_dtype": "float32",
27
- "transformers_version": "4.38.2",
28
  "trigram_input": true,
29
  "true_hidden_size": 128,
30
  "type_vocab_size": 2,
 
24
  "pad_token_id": 0,
25
  "problem_type": "single_label_classification",
26
  "torch_dtype": "float32",
27
+ "transformers_version": "4.27.2",
28
  "trigram_input": true,
29
  "true_hidden_size": 128,
30
  "type_vocab_size": 2,
run-4/checkpoint-214/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fdbf96832c06e52bb8b1cde816e42cfad4a0757faf8bd66785932f6b7fb0d06
3
- size 197593757
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8a32cd30cf33bbf1b108a26d3d75ea9840ac3185d314d19bfbbaadb45d4f804
3
+ size 197314895
run-4/checkpoint-214/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22549d8b7cdd063e2742ba38507f50641316f8e06710e574d061547c35ed8c7b
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89eb09fce7bbf8122a2c597fc54308b6b95066415fc5d099681a8e68d19f4869
3
+ size 14575
run-4/checkpoint-214/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51c2aa66da65c248eea02a8e8f0b50cf1f7ae270c245373af6ebf25ec8a644b5
3
- size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88668f3a4e695b514f2a6547cc3d5ecbea753cfa5e4fad0bb9d8f868327d0bd1
3
+ size 627
run-4/checkpoint-214/tokenizer_config.json CHANGED
@@ -1,53 +1,11 @@
1
  {
2
- "added_tokens_decoder": {
3
- "0": {
4
- "content": "[PAD]",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false,
9
- "special": true
10
- },
11
- "100": {
12
- "content": "[UNK]",
13
- "lstrip": false,
14
- "normalized": false,
15
- "rstrip": false,
16
- "single_word": false,
17
- "special": true
18
- },
19
- "101": {
20
- "content": "[CLS]",
21
- "lstrip": false,
22
- "normalized": false,
23
- "rstrip": false,
24
- "single_word": false,
25
- "special": true
26
- },
27
- "102": {
28
- "content": "[SEP]",
29
- "lstrip": false,
30
- "normalized": false,
31
- "rstrip": false,
32
- "single_word": false,
33
- "special": true
34
- },
35
- "103": {
36
- "content": "[MASK]",
37
- "lstrip": false,
38
- "normalized": false,
39
- "rstrip": false,
40
- "single_word": false,
41
- "special": true
42
- }
43
- },
44
- "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
48
  "model_max_length": 1000000000000000019884624838656,
49
  "pad_token": "[PAD]",
50
  "sep_token": "[SEP]",
 
51
  "strip_accents": null,
52
  "tokenize_chinese_chars": true,
53
  "tokenizer_class": "MobileBertTokenizer",
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "cls_token": "[CLS]",
3
  "do_lower_case": true,
4
  "mask_token": "[MASK]",
5
  "model_max_length": 1000000000000000019884624838656,
6
  "pad_token": "[PAD]",
7
  "sep_token": "[SEP]",
8
+ "special_tokens_map_file": null,
9
  "strip_accents": null,
10
  "tokenize_chinese_chars": true,
11
  "tokenizer_class": "MobileBertTokenizer",
run-4/checkpoint-214/trainer_state.json CHANGED
@@ -1,8 +1,7 @@
1
  {
2
- "best_metric": 0.03718764224408827,
3
- "best_model_checkpoint": "mobilebert-uncased-finetuned-cola/run-4/checkpoint-214",
4
- "epoch": 1.0,
5
- "eval_steps": 500,
6
  "global_step": 214,
7
  "is_hyper_param_search": true,
8
  "is_local_process_zero": true,
@@ -10,26 +9,31 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 108810.078125,
14
- "eval_matthews_correlation": 0.03718764224408827,
15
- "eval_runtime": 3.0667,
16
- "eval_samples_per_second": 340.1,
17
- "eval_steps_per_second": 21.521,
 
 
 
 
 
 
 
 
 
18
  "step": 214
19
  }
20
  ],
21
- "logging_steps": 500,
22
- "max_steps": 214,
23
- "num_input_tokens_seen": 0,
24
- "num_train_epochs": 1,
25
- "save_steps": 500,
26
  "total_flos": 0,
27
- "train_batch_size": 4,
28
  "trial_name": null,
29
  "trial_params": {
30
- "learning_rate": 2.6926940399761e-06,
31
- "num_train_epochs": 1,
32
- "per_device_train_batch_size": 4,
33
- "seed": 4
34
  }
35
  }
 
1
  {
2
+ "best_metric": 0.007984019525529589,
3
+ "best_model_checkpoint": "mobilebert-uncased-finetuned-cola/run-4/checkpoint-107",
4
+ "epoch": 2.0,
 
5
  "global_step": 214,
6
  "is_hyper_param_search": true,
7
  "is_local_process_zero": true,
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_loss": 0.7695204615592957,
13
+ "eval_matthews_correlation": 0.007984019525529589,
14
+ "eval_runtime": 2.6807,
15
+ "eval_samples_per_second": 389.079,
16
+ "eval_steps_per_second": 24.621,
17
+ "step": 107
18
+ },
19
+ {
20
+ "epoch": 2.0,
21
+ "eval_loss": 0.982637345790863,
22
+ "eval_matthews_correlation": 0.0,
23
+ "eval_runtime": 2.5108,
24
+ "eval_samples_per_second": 415.4,
25
+ "eval_steps_per_second": 26.286,
26
  "step": 214
27
  }
28
  ],
29
+ "max_steps": 428,
30
+ "num_train_epochs": 4,
 
 
 
31
  "total_flos": 0,
 
32
  "trial_name": null,
33
  "trial_params": {
34
+ "learning_rate": 2.428172543385948e-05,
35
+ "num_train_epochs": 4,
36
+ "per_device_train_batch_size": 8,
37
+ "seed": 12
38
  }
39
  }
run-4/checkpoint-214/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bd329de3edddbb0dd3482875f0b22efe973dc98362a309a016e3810926e0724
3
- size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:134616c5175b1859b10e1348047fd02338d55705f285410aa8f7fdae509fbe5f
3
+ size 3643
runs/Mar10_12-23-35_f87fe01c66be/1710074696.770817/events.out.tfevents.1710074696.f87fe01c66be.29486.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25350c39541fbe7bafb01ffedb88851d1a5dfc9c61b16e93dd0147955877ea6c
3
+ size 5884
runs/Mar10_12-23-35_f87fe01c66be/events.out.tfevents.1710074624.f87fe01c66be.29486.9 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4a6582370f3e422230415b8f1f5198912e25cdd14d7cac60415c577de47130e
3
- size 5269
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de10155ab0556d5bf9c88de7caca085933fe30da4d1cd65496f47156a7ed0a34
3
+ size 5623
runs/Mar10_12-23-35_f87fe01c66be/events.out.tfevents.1710074696.f87fe01c66be.29486.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54bd31bc34a38d0bfc349aa96b54ab6cae7f916e7f449d80b111a337a43ced0d
3
+ size 4938
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f666641269d2be95ebba45cd0c3329b54e018e7cffd36b81419b54a5c946a9fe
3
  size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:134616c5175b1859b10e1348047fd02338d55705f285410aa8f7fdae509fbe5f
3
  size 3643