Jeremiah Zhou committed on
Commit
52163ed
1 Parent(s): 30c5adb

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_loss": 0.5405848622322083,
4
+ "eval_matthews_correlation": 0.5880094937717885,
5
+ "eval_runtime": 5.0883,
6
+ "eval_samples": 1043,
7
+ "eval_samples_per_second": 204.979,
8
+ "eval_steps_per_second": 25.745,
9
+ "train_loss": 0.31582939565478274,
10
+ "train_runtime": 345.3367,
11
+ "train_samples": 8551,
12
+ "train_samples_per_second": 74.284,
13
+ "train_steps_per_second": 2.328
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_loss": 0.5405848622322083,
4
+ "eval_matthews_correlation": 0.5880094937717885,
5
+ "eval_runtime": 5.0883,
6
+ "eval_samples": 1043,
7
+ "eval_samples_per_second": 204.979,
8
+ "eval_steps_per_second": 25.745
9
+ }
runs/Jun21_21-11-15_pikachu/events.out.tfevents.1655817742.pikachu.3270481.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e0efc5f3050ce0ee3718c306aade21a40878b6826de5596cc7095f6f9a7f2b6
3
+ size 375
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "train_loss": 0.31582939565478274,
4
+ "train_runtime": 345.3367,
5
+ "train_samples": 8551,
6
+ "train_samples_per_second": 74.284,
7
+ "train_steps_per_second": 2.328
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5880094937717885,
3
+ "best_model_checkpoint": "./fine-tune/bert-base-uncased/cola/checkpoint-804",
4
+ "epoch": 3.0,
5
+ "global_step": 804,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "eval_loss": 0.45977166295051575,
13
+ "eval_matthews_correlation": 0.5134946392219878,
14
+ "eval_runtime": 5.9561,
15
+ "eval_samples_per_second": 175.115,
16
+ "eval_steps_per_second": 21.994,
17
+ "step": 268
18
+ },
19
+ {
20
+ "epoch": 1.87,
21
+ "learning_rate": 7.5621890547263685e-06,
22
+ "loss": 0.393,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 2.0,
27
+ "eval_loss": 0.4875448942184448,
28
+ "eval_matthews_correlation": 0.5573424050983508,
29
+ "eval_runtime": 2.8786,
30
+ "eval_samples_per_second": 362.324,
31
+ "eval_steps_per_second": 45.508,
32
+ "step": 536
33
+ },
34
+ {
35
+ "epoch": 3.0,
36
+ "eval_loss": 0.5405848622322083,
37
+ "eval_matthews_correlation": 0.5880094937717885,
38
+ "eval_runtime": 5.5175,
39
+ "eval_samples_per_second": 189.036,
40
+ "eval_steps_per_second": 23.743,
41
+ "step": 804
42
+ },
43
+ {
44
+ "epoch": 3.0,
45
+ "step": 804,
46
+ "total_flos": 1687396975787520.0,
47
+ "train_loss": 0.31582939565478274,
48
+ "train_runtime": 345.3367,
49
+ "train_samples_per_second": 74.284,
50
+ "train_steps_per_second": 2.328
51
+ }
52
+ ],
53
+ "max_steps": 804,
54
+ "num_train_epochs": 3,
55
+ "total_flos": 1687396975787520.0,
56
+ "trial_name": null,
57
+ "trial_params": null
58
+ }