gchhablani commited on
Commit
cdee9e3
1 Parent(s): 0ae3fd9

End of training

Browse files
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_loss": 0.6499619483947754,
4
  "eval_matthews_correlation": 0.0,
5
- "eval_runtime": 23.3578,
6
  "eval_samples": 1043,
7
- "eval_samples_per_second": 44.653,
8
- "eval_steps_per_second": 5.608,
9
- "train_loss": 0.0,
10
- "train_runtime": 0.0205,
11
  "train_samples": 8551,
12
- "train_samples_per_second": 1248914.483,
13
- "train_steps_per_second": 312265.134
14
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_loss": 0.6500726342201233,
4
  "eval_matthews_correlation": 0.0,
5
+ "eval_runtime": 23.0231,
6
  "eval_samples": 1043,
7
+ "eval_samples_per_second": 45.302,
8
+ "eval_steps_per_second": 5.69,
9
+ "train_loss": 0.2530779532565482,
10
+ "train_runtime": 1420.0633,
11
  "train_samples": 8551,
12
+ "train_samples_per_second": 30.108,
13
+ "train_steps_per_second": 7.528
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_loss": 0.6499619483947754,
4
  "eval_matthews_correlation": 0.0,
5
- "eval_runtime": 23.3578,
6
  "eval_samples": 1043,
7
- "eval_samples_per_second": 44.653,
8
- "eval_steps_per_second": 5.608
9
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_loss": 0.6500726342201233,
4
  "eval_matthews_correlation": 0.0,
5
+ "eval_runtime": 23.0231,
6
  "eval_samples": 1043,
7
+ "eval_samples_per_second": 45.302,
8
+ "eval_steps_per_second": 5.69
9
  }
runs/Oct10_19-05-40_patrick-general-gpu/events.out.tfevents.1633892756.patrick-general-gpu.125503.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c948bd98023c44aa14a8569fddadf0202d6d271d154cb83234eaf39d0811306
3
- size 4260
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03fb645e00e2084e20fb6a704ba71080e4c774bd2c71f9a07a3ec0e1719f6cd9
3
+ size 4614
runs/Oct10_19-05-40_patrick-general-gpu/events.out.tfevents.1633894217.patrick-general-gpu.125503.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c20c35361cbf4976f5b9d6dedeb387031cbd381449eb2474220cabbf2f30fff6
3
+ size 375
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "train_loss": 0.0,
4
- "train_runtime": 0.0205,
5
  "train_samples": 8551,
6
- "train_samples_per_second": 1248914.483,
7
- "train_steps_per_second": 312265.134
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "train_loss": 0.2530779532565482,
4
+ "train_runtime": 1420.0633,
5
  "train_samples": 8551,
6
+ "train_samples_per_second": 30.108,
7
+ "train_steps_per_second": 7.528
8
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.0,
5
- "global_step": 6414,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -53,18 +53,48 @@
53
  "step": 6414
54
  },
55
  {
56
- "epoch": 3.0,
57
- "step": 6414,
58
- "total_flos": 1.6048929796061184e+16,
59
- "train_loss": 0.0,
60
- "train_runtime": 0.0205,
61
- "train_samples_per_second": 1248914.483,
62
- "train_steps_per_second": 312265.134
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  }
64
  ],
65
- "max_steps": 6414,
66
- "num_train_epochs": 3,
67
- "total_flos": 1.6048929796061184e+16,
68
  "trial_name": null,
69
  "trial_params": null
70
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.0,
5
+ "global_step": 10690,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
53
  "step": 6414
54
  },
55
  {
56
+ "epoch": 4.0,
57
+ "learning_rate": 8.966666666666667e-06,
58
+ "loss": 0.6342,
59
+ "step": 8552
60
+ },
61
+ {
62
+ "epoch": 4.0,
63
+ "eval_loss": 0.6344217658042908,
64
+ "eval_matthews_correlation": 0.0,
65
+ "eval_runtime": 22.7688,
66
+ "eval_samples_per_second": 45.808,
67
+ "eval_steps_per_second": 5.753,
68
+ "step": 8552
69
+ },
70
+ {
71
+ "epoch": 5.0,
72
+ "learning_rate": 1e-07,
73
+ "loss": 0.6312,
74
+ "step": 10690
75
+ },
76
+ {
77
+ "epoch": 5.0,
78
+ "eval_loss": 0.6500726342201233,
79
+ "eval_matthews_correlation": 0.0,
80
+ "eval_runtime": 22.7519,
81
+ "eval_samples_per_second": 45.842,
82
+ "eval_steps_per_second": 5.758,
83
+ "step": 10690
84
+ },
85
+ {
86
+ "epoch": 5.0,
87
+ "step": 10690,
88
+ "total_flos": 2.674821632676864e+16,
89
+ "train_loss": 0.2530779532565482,
90
+ "train_runtime": 1420.0633,
91
+ "train_samples_per_second": 30.108,
92
+ "train_steps_per_second": 7.528
93
  }
94
  ],
95
+ "max_steps": 10690,
96
+ "num_train_epochs": 5,
97
+ "total_flos": 2.674821632676864e+16,
98
  "trial_name": null,
99
  "trial_params": null
100
  }