obudzecie commited on
Commit
e7dc6da
·
verified ·
1 Parent(s): 1bf1cdd

Training in progress, epoch 1

Browse files
Files changed (38) hide show
  1. model.safetensors +1 -1
  2. run-3/checkpoint-108/model.safetensors +1 -1
  3. run-3/checkpoint-108/optimizer.pt +1 -1
  4. run-3/checkpoint-108/rng_state.pth +1 -1
  5. run-3/checkpoint-108/scheduler.pt +1 -1
  6. run-3/checkpoint-108/trainer_state.json +17 -17
  7. run-3/checkpoint-108/training_args.bin +1 -1
  8. run-3/checkpoint-162/config.json +25 -0
  9. run-3/checkpoint-162/model.safetensors +3 -0
  10. run-3/checkpoint-162/optimizer.pt +3 -0
  11. run-3/checkpoint-162/rng_state.pth +3 -0
  12. run-3/checkpoint-162/scheduler.pt +3 -0
  13. run-3/checkpoint-162/special_tokens_map.json +7 -0
  14. run-3/checkpoint-162/tokenizer.json +0 -0
  15. run-3/checkpoint-162/tokenizer_config.json +55 -0
  16. run-3/checkpoint-162/trainer_state.json +53 -0
  17. run-3/checkpoint-162/training_args.bin +3 -0
  18. run-3/checkpoint-162/vocab.txt +0 -0
  19. run-3/checkpoint-54/model.safetensors +1 -1
  20. run-3/checkpoint-54/optimizer.pt +1 -1
  21. run-3/checkpoint-54/rng_state.pth +1 -1
  22. run-3/checkpoint-54/scheduler.pt +1 -1
  23. run-3/checkpoint-54/trainer_state.json +11 -11
  24. run-3/checkpoint-54/training_args.bin +1 -1
  25. run-4/checkpoint-27/model.safetensors +1 -1
  26. run-4/checkpoint-27/optimizer.pt +1 -1
  27. run-4/checkpoint-27/rng_state.pth +2 -2
  28. run-4/checkpoint-27/scheduler.pt +1 -1
  29. run-4/checkpoint-27/trainer_state.json +13 -13
  30. run-4/checkpoint-27/training_args.bin +1 -1
  31. run-4/checkpoint-54/model.safetensors +1 -1
  32. run-4/checkpoint-54/optimizer.pt +1 -1
  33. run-4/checkpoint-54/rng_state.pth +2 -2
  34. run-4/checkpoint-54/scheduler.pt +1 -1
  35. run-4/checkpoint-54/trainer_state.json +17 -17
  36. run-4/checkpoint-54/training_args.bin +1 -1
  37. runs/Feb27_18-29-22_d3d09c0dfc16/events.out.tfevents.1709062232.d3d09c0dfc16.836.15 +3 -0
  38. training_args.bin +1 -1
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb5ded2d8837a663201a30e2fdd4c372dbd041adbea6fbb11f8318d354748fa3
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02caef41fefa36cf5f027762072464d39baa40817c70225bb534790af6f857bf
3
  size 267832560
run-3/checkpoint-108/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2049d4ff235930194209bcadba68c9f28941831d6be8afb9ab23bc11cad98cf8
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:642d76e7cafeab26ef3b6b0e615ba8c803a310d9ea436c6591c9c7398171fa59
3
  size 267832560
run-3/checkpoint-108/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee583b89c741c6d92754ea2b2acf8a5bd79e33ef5565146603053c67e8cd7737
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6944dd1154c9965be4b93a2d85a0a4673484630eec4a0f52b3ae37dfc1f0641a
3
  size 535727290
run-3/checkpoint-108/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3e297b7ae7c4df82a1ce845cf84be286dc57704c50dd059929e95c24abad79b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00e7e60447fe6b0b398d23f91b0df5696220d68e25fe4da0911193612264b803
3
  size 14244
run-3/checkpoint-108/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19359dc969a3dad51efa9a2d6f6d5e94a562a510034e89ecbf12473bedf87e37
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94f038ef9a5ad66a472c64034862a7278e5094b40e5d1c995ba1d16aa99930e3
3
  size 1064
run-3/checkpoint-108/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.0,
3
- "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-54",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 108,
@@ -10,35 +10,35 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.6135343909263611,
14
- "eval_matthews_correlation": 0.0,
15
- "eval_runtime": 0.6686,
16
- "eval_samples_per_second": 1560.01,
17
- "eval_steps_per_second": 98.716,
18
  "step": 54
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_loss": 0.6109986901283264,
23
- "eval_matthews_correlation": 0.0,
24
- "eval_runtime": 1.2142,
25
- "eval_samples_per_second": 859.036,
26
- "eval_steps_per_second": 54.359,
27
  "step": 108
28
  }
29
  ],
30
  "logging_steps": 500,
31
- "max_steps": 108,
32
  "num_input_tokens_seen": 0,
33
- "num_train_epochs": 2,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
  "train_batch_size": 16,
37
  "trial_name": null,
38
  "trial_params": {
39
- "learning_rate": 7.371411848219159e-06,
40
- "num_train_epochs": 2,
41
  "per_device_train_batch_size": 16,
42
- "seed": 35
43
  }
44
  }
 
1
  {
2
+ "best_metric": 0.3349942831439903,
3
+ "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-108",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 108,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.5624595880508423,
14
+ "eval_matthews_correlation": 0.10385466804655791,
15
+ "eval_runtime": 1.2797,
16
+ "eval_samples_per_second": 815.034,
17
+ "eval_steps_per_second": 102.368,
18
  "step": 54
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_loss": 0.6093302965164185,
23
+ "eval_matthews_correlation": 0.3349942831439903,
24
+ "eval_runtime": 1.2473,
25
+ "eval_samples_per_second": 836.218,
26
+ "eval_steps_per_second": 105.028,
27
  "step": 108
28
  }
29
  ],
30
  "logging_steps": 500,
31
+ "max_steps": 162,
32
  "num_input_tokens_seen": 0,
33
+ "num_train_epochs": 3,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
  "train_batch_size": 16,
37
  "trial_name": null,
38
  "trial_params": {
39
+ "learning_rate": 5.503532571253603e-05,
40
+ "num_train_epochs": 3,
41
  "per_device_train_batch_size": 16,
42
+ "seed": 28
43
  }
44
  }
run-3/checkpoint-108/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6ae447073f49fbe1616e5d8dd0fa3e8b79bcfd527890bf6b4740cb1b9964bfc
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e3db3d5ec943b438ad149fa26941b66a79396dd3ca6343d9f839d70c53ba46e
3
  size 4984
run-3/checkpoint-162/config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "initializer_range": 0.02,
12
+ "max_position_embeddings": 512,
13
+ "model_type": "distilbert",
14
+ "n_heads": 12,
15
+ "n_layers": 6,
16
+ "pad_token_id": 0,
17
+ "problem_type": "single_label_classification",
18
+ "qa_dropout": 0.1,
19
+ "seq_classif_dropout": 0.2,
20
+ "sinusoidal_pos_embds": false,
21
+ "tie_weights_": true,
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.38.1",
24
+ "vocab_size": 30522
25
+ }
run-3/checkpoint-162/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6abceff8f22a2cfd12053432245d5933303321858fe56f5c7fb47d0632575343
3
+ size 267832560
run-3/checkpoint-162/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dac662f6204023e4b708390d71585cbfe36afa461bddbc778c15d7fc7327a0d
3
+ size 535727290
run-3/checkpoint-162/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:210f6311babf339b2041dd94e325452cfc47bb4600ce72bcc997b3fc1f605149
3
+ size 14244
run-3/checkpoint-162/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8057fb71e85d5890ca5afa2a056fc36a323c67edad6e2652270aca621736ccbd
3
+ size 1064
run-3/checkpoint-162/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
run-3/checkpoint-162/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
run-3/checkpoint-162/tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "mask_token": "[MASK]",
48
+ "model_max_length": 512,
49
+ "pad_token": "[PAD]",
50
+ "sep_token": "[SEP]",
51
+ "strip_accents": null,
52
+ "tokenize_chinese_chars": true,
53
+ "tokenizer_class": "DistilBertTokenizer",
54
+ "unk_token": "[UNK]"
55
+ }
run-3/checkpoint-162/trainer_state.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.346176833033057,
3
+ "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-162",
4
+ "epoch": 3.0,
5
+ "eval_steps": 500,
6
+ "global_step": 162,
7
+ "is_hyper_param_search": true,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_loss": 0.5624595880508423,
14
+ "eval_matthews_correlation": 0.10385466804655791,
15
+ "eval_runtime": 1.2797,
16
+ "eval_samples_per_second": 815.034,
17
+ "eval_steps_per_second": 102.368,
18
+ "step": 54
19
+ },
20
+ {
21
+ "epoch": 2.0,
22
+ "eval_loss": 0.6093302965164185,
23
+ "eval_matthews_correlation": 0.3349942831439903,
24
+ "eval_runtime": 1.2473,
25
+ "eval_samples_per_second": 836.218,
26
+ "eval_steps_per_second": 105.028,
27
+ "step": 108
28
+ },
29
+ {
30
+ "epoch": 3.0,
31
+ "eval_loss": 0.7864214777946472,
32
+ "eval_matthews_correlation": 0.346176833033057,
33
+ "eval_runtime": 1.4034,
34
+ "eval_samples_per_second": 743.189,
35
+ "eval_steps_per_second": 93.344,
36
+ "step": 162
37
+ }
38
+ ],
39
+ "logging_steps": 500,
40
+ "max_steps": 162,
41
+ "num_input_tokens_seen": 0,
42
+ "num_train_epochs": 3,
43
+ "save_steps": 500,
44
+ "total_flos": 0,
45
+ "train_batch_size": 16,
46
+ "trial_name": null,
47
+ "trial_params": {
48
+ "learning_rate": 5.503532571253603e-05,
49
+ "num_train_epochs": 3,
50
+ "per_device_train_batch_size": 16,
51
+ "seed": 28
52
+ }
53
+ }
run-3/checkpoint-162/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e3db3d5ec943b438ad149fa26941b66a79396dd3ca6343d9f839d70c53ba46e
3
+ size 4984
run-3/checkpoint-162/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
run-3/checkpoint-54/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a07b3521cc8479b97635017fd08648a7bea2791ad6ec7bace28d41fb6d5321c4
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb5ded2d8837a663201a30e2fdd4c372dbd041adbea6fbb11f8318d354748fa3
3
  size 267832560
run-3/checkpoint-54/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3c9bdaa0c6dd042796f0553c74172060ba3f9ff26517f16579571c24bcf23ae
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eaa5dd6b072e42070f8bc0572641f570e5d8203f8d3d310146222a81e68a48c
3
  size 535727290
run-3/checkpoint-54/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b760589f8554fc9a823461802d959d20ee6933034d468005d9e9650985646e1
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29c2d4d1404a256eed2965ed677a952e14f2bcce3c6968bd06bbea290182bad5
3
  size 14244
run-3/checkpoint-54/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e821cd8c0cea6045dab45710ac190a0970d06aa7c327d90cc1165ca399b6078
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1527b641c9f756a5765a3afc0eb992211442419cc2281db17ece7b38dc9271c0
3
  size 1064
run-3/checkpoint-54/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.0,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-54",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,26 +10,26 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.6135343909263611,
14
- "eval_matthews_correlation": 0.0,
15
- "eval_runtime": 0.6686,
16
- "eval_samples_per_second": 1560.01,
17
- "eval_steps_per_second": 98.716,
18
  "step": 54
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 108,
23
  "num_input_tokens_seen": 0,
24
- "num_train_epochs": 2,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
  "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": {
30
- "learning_rate": 7.371411848219159e-06,
31
- "num_train_epochs": 2,
32
  "per_device_train_batch_size": 16,
33
- "seed": 35
34
  }
35
  }
 
1
  {
2
+ "best_metric": 0.10385466804655791,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-54",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.5624595880508423,
14
+ "eval_matthews_correlation": 0.10385466804655791,
15
+ "eval_runtime": 1.2797,
16
+ "eval_samples_per_second": 815.034,
17
+ "eval_steps_per_second": 102.368,
18
  "step": 54
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 162,
23
  "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 3,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
  "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": {
30
+ "learning_rate": 5.503532571253603e-05,
31
+ "num_train_epochs": 3,
32
  "per_device_train_batch_size": 16,
33
+ "seed": 28
34
  }
35
  }
run-3/checkpoint-54/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6ae447073f49fbe1616e5d8dd0fa3e8b79bcfd527890bf6b4740cb1b9964bfc
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e3db3d5ec943b438ad149fa26941b66a79396dd3ca6343d9f839d70c53ba46e
3
  size 4984
run-4/checkpoint-27/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4542ea02296c83bed04f3c54cf00db1bc8503bfaad3f396b82b3e6187ab61d9
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02caef41fefa36cf5f027762072464d39baa40817c70225bb534790af6f857bf
3
  size 267832560
run-4/checkpoint-27/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3047b77b90fa6d77cafeafdcbc70682204686a1d2c84e65c2d0e9e3d85bf779
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ecd5623494e65cfa6c6677d1d9819c3f3c662876a8aed41ae386887f83058da
3
  size 535727290
run-4/checkpoint-27/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48abff7665a73e9406f2b3a959d01e6695705f7feda5c2b9fb6e70fad11bc462
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a4a2560c602f523c91c485207028a3dbcb7126aebac96a22736d83aa2ec429e
3
+ size 14308
run-4/checkpoint-27/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89c5e803b7810f245162c0c757de90c445efa6c3ac6f29e78ca07f90ca825d2a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6aa53b3d0a4d6382222988653cd7469ec80a1749702e6aee6c8c16d249816344
3
  size 1064
run-4/checkpoint-27/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.0,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-27",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,26 +10,26 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.6171508431434631,
14
- "eval_matthews_correlation": 0.0,
15
- "eval_runtime": 1.2254,
16
- "eval_samples_per_second": 851.142,
17
- "eval_steps_per_second": 106.903,
18
  "step": 27
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 135,
23
  "num_input_tokens_seen": 0,
24
- "num_train_epochs": 5,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
- "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": {
30
- "learning_rate": 7.141254091425431e-06,
31
- "num_train_epochs": 5,
32
- "per_device_train_batch_size": 16,
33
- "seed": 4
34
  }
35
  }
 
1
  {
2
+ "best_metric": -0.020702674026557004,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-27",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.669028103351593,
14
+ "eval_matthews_correlation": -0.020702674026557004,
15
+ "eval_runtime": 0.9548,
16
+ "eval_samples_per_second": 1092.354,
17
+ "eval_steps_per_second": 137.199,
18
  "step": 27
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 54,
23
  "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 2,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
+ "train_batch_size": 32,
28
  "trial_name": null,
29
  "trial_params": {
30
+ "learning_rate": 2.7461506090980817e-06,
31
+ "num_train_epochs": 2,
32
+ "per_device_train_batch_size": 32,
33
+ "seed": 24
34
  }
35
  }
run-4/checkpoint-27/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b272556a909ee8d46e26a918cf12e067d37cdfcdb6fc7bb9dd145e02aa9cb279
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef1f877c640f97e98c8da61a50566872c84628849589a156be7119b1ff81f04
3
  size 4984
run-4/checkpoint-54/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8ffa22d670fd8d875f0874f56277b766324b6c576424e31e03488878974f06c
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb80a875bbe0413ac86706048ef604bc174b717e8166512c5cdf1e3ef4e86279
3
  size 267832560
run-4/checkpoint-54/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:711bd5c2eaa53854115a17390ce4ca1f9f8640bbf3bf3d9d3682e3ea030b8b2b
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10df1ad217933501acd883e6fa992bba33d96998aef9f160d25e699c875811fa
3
  size 535727290
run-4/checkpoint-54/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7daa4263b1198655a1441081a5b33c5bce53494dcd0610b8798d313ef92eff4e
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63d63a234463881e0d3edc4fc567ea7c1bae29e71ad748fcee605f8784baf6e3
3
+ size 14308
run-4/checkpoint-54/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab38497e119d49371b53e85f5cfb7d41c0903e3c9879e2bb0e6b7c1e0e7bff52
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:446a76f3ec584c657712cc0b5cb821862b8c52c9581d425f442d00177034fa3b
3
  size 1064
run-4/checkpoint-54/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_metric": 0.0,
3
- "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-27",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 54,
@@ -10,35 +10,35 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_loss": 0.6171508431434631,
14
- "eval_matthews_correlation": 0.0,
15
- "eval_runtime": 1.2254,
16
- "eval_samples_per_second": 851.142,
17
- "eval_steps_per_second": 106.903,
18
  "step": 27
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_loss": 0.6099013686180115,
23
  "eval_matthews_correlation": 0.0,
24
- "eval_runtime": 1.2265,
25
- "eval_samples_per_second": 850.398,
26
- "eval_steps_per_second": 106.809,
27
  "step": 54
28
  }
29
  ],
30
  "logging_steps": 500,
31
- "max_steps": 135,
32
  "num_input_tokens_seen": 0,
33
- "num_train_epochs": 5,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
- "train_batch_size": 16,
37
  "trial_name": null,
38
  "trial_params": {
39
- "learning_rate": 7.141254091425431e-06,
40
- "num_train_epochs": 5,
41
- "per_device_train_batch_size": 16,
42
- "seed": 4
43
  }
44
  }
 
1
  {
2
  "best_metric": 0.0,
3
+ "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-4/checkpoint-54",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 54,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_loss": 0.669028103351593,
14
+ "eval_matthews_correlation": -0.020702674026557004,
15
+ "eval_runtime": 0.9548,
16
+ "eval_samples_per_second": 1092.354,
17
+ "eval_steps_per_second": 137.199,
18
  "step": 27
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_loss": 0.6553832292556763,
23
  "eval_matthews_correlation": 0.0,
24
+ "eval_runtime": 1.9693,
25
+ "eval_samples_per_second": 529.631,
26
+ "eval_steps_per_second": 66.521,
27
  "step": 54
28
  }
29
  ],
30
  "logging_steps": 500,
31
+ "max_steps": 54,
32
  "num_input_tokens_seen": 0,
33
+ "num_train_epochs": 2,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
+ "train_batch_size": 32,
37
  "trial_name": null,
38
  "trial_params": {
39
+ "learning_rate": 2.7461506090980817e-06,
40
+ "num_train_epochs": 2,
41
+ "per_device_train_batch_size": 32,
42
+ "seed": 24
43
  }
44
  }
run-4/checkpoint-54/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b272556a909ee8d46e26a918cf12e067d37cdfcdb6fc7bb9dd145e02aa9cb279
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef1f877c640f97e98c8da61a50566872c84628849589a156be7119b1ff81f04
3
  size 4984
runs/Feb27_18-29-22_d3d09c0dfc16/events.out.tfevents.1709062232.d3d09c0dfc16.836.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5542e74d80b551a338d73a53a7a3d383a29704cb6df5464aff0eea8b05f9741c
3
+ size 5547
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e3db3d5ec943b438ad149fa26941b66a79396dd3ca6343d9f839d70c53ba46e
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef1f877c640f97e98c8da61a50566872c84628849589a156be7119b1ff81f04
3
  size 4984