StevenLimcorn committed on
Commit
b88124b
1 Parent(s): 5a3bf69

End of training

Browse files
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 30.0,
3
- "eval_accuracy": 0.7397590361445783,
4
- "eval_loss": 1.1226757764816284,
5
- "eval_runtime": 0.9717,
6
  "eval_samples": 6,
7
- "eval_samples_per_second": 6.175,
8
- "eval_steps_per_second": 2.058,
9
- "perplexity": 3.073066049722984,
10
- "train_loss": 1.552490357146866,
11
- "train_runtime": 2803.476,
12
  "train_samples": 229,
13
- "train_samples_per_second": 2.451,
14
- "train_steps_per_second": 0.621
15
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.6788321167883211,
4
+ "eval_loss": 1.5589643716812134,
5
+ "eval_runtime": 0.4914,
6
  "eval_samples": 6,
7
+ "eval_samples_per_second": 12.209,
8
+ "eval_steps_per_second": 4.07,
9
+ "perplexity": 4.753895426191399,
10
+ "train_loss": 2.016565941120016,
11
+ "train_runtime": 632.1099,
12
  "train_samples": 229,
13
+ "train_samples_per_second": 3.623,
14
+ "train_steps_per_second": 0.918
15
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "epoch": 30.0,
3
- "eval_accuracy": 0.7397590361445783,
4
- "eval_loss": 1.1226757764816284,
5
- "eval_runtime": 0.9717,
6
  "eval_samples": 6,
7
- "eval_samples_per_second": 6.175,
8
- "eval_steps_per_second": 2.058,
9
- "perplexity": 3.073066049722984
10
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.6788321167883211,
4
+ "eval_loss": 1.5589643716812134,
5
+ "eval_runtime": 0.4914,
6
  "eval_samples": 6,
7
+ "eval_samples_per_second": 12.209,
8
+ "eval_steps_per_second": 4.07,
9
+ "perplexity": 4.753895426191399
10
  }
runs/Apr23_10-00-54_496995bf93a4/events.out.tfevents.1682245221.496995bf93a4.66939.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10c727174bee202ba6211a25e37e968d1352ca9510705309e234cf4de9f84b34
3
+ size 363
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 30.0,
3
- "train_loss": 1.552490357146866,
4
- "train_runtime": 2803.476,
5
  "train_samples": 229,
6
- "train_samples_per_second": 2.451,
7
- "train_steps_per_second": 0.621
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "train_loss": 2.016565941120016,
4
+ "train_runtime": 632.1099,
5
  "train_samples": 229,
6
+ "train_samples_per_second": 3.623,
7
+ "train_steps_per_second": 0.918
8
  }
trainer_state.json CHANGED
@@ -1,43 +1,31 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 30.0,
5
- "global_step": 1740,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 8.62,
12
- "learning_rate": 3.563218390804598e-05,
13
- "loss": 2.043,
14
- "step": 500
15
- },
16
- {
17
- "epoch": 17.24,
18
- "learning_rate": 2.1264367816091954e-05,
19
- "loss": 1.539,
20
- "step": 1000
21
- },
22
- {
23
- "epoch": 25.86,
24
  "learning_rate": 6.896551724137932e-06,
25
- "loss": 1.2681,
26
- "step": 1500
27
  },
28
  {
29
- "epoch": 30.0,
30
- "step": 1740,
31
- "total_flos": 6403012579676160.0,
32
- "train_loss": 1.552490357146866,
33
- "train_runtime": 2803.476,
34
- "train_samples_per_second": 2.451,
35
- "train_steps_per_second": 0.621
36
  }
37
  ],
38
- "max_steps": 1740,
39
- "num_train_epochs": 30,
40
- "total_flos": 6403012579676160.0,
41
  "trial_name": null,
42
  "trial_params": null
43
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.0,
5
+ "global_step": 580,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 8.62,
 
 
 
 
 
 
 
 
 
 
 
 
12
  "learning_rate": 6.896551724137932e-06,
13
+ "loss": 2.0521,
14
+ "step": 500
15
  },
16
  {
17
+ "epoch": 10.0,
18
+ "step": 580,
19
+ "total_flos": 2134337526558720.0,
20
+ "train_loss": 2.016565941120016,
21
+ "train_runtime": 632.1099,
22
+ "train_samples_per_second": 3.623,
23
+ "train_steps_per_second": 0.918
24
  }
25
  ],
26
+ "max_steps": 580,
27
+ "num_train_epochs": 10,
28
+ "total_flos": 2134337526558720.0,
29
  "trial_name": null,
30
  "trial_params": null
31
  }