mattchurgin committed on
Commit
7b922ac
1 Parent(s): b678f60

End of training

Browse files
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
- "epoch": 1.0,
3
  "eval_loss": Infinity,
4
- "eval_runtime": 10.8674,
5
  "eval_samples": 301,
6
- "eval_samples_per_second": 27.697,
7
- "eval_steps_per_second": 3.497,
8
  "eval_wer": 1.0,
9
- "train_loss": 4.538612365722656,
10
- "train_runtime": 34.6,
11
  "train_samples": 704,
12
- "train_samples_per_second": 20.347,
13
- "train_steps_per_second": 2.543
14
  }
 
1
  {
2
+ "epoch": 3.0,
3
  "eval_loss": Infinity,
4
+ "eval_runtime": 10.6149,
5
  "eval_samples": 301,
6
+ "eval_samples_per_second": 28.356,
7
+ "eval_steps_per_second": 3.58,
8
  "eval_wer": 1.0,
9
+ "train_loss": 3.7429571440725615,
10
+ "train_runtime": 101.8953,
11
  "train_samples": 704,
12
+ "train_samples_per_second": 20.727,
13
+ "train_steps_per_second": 2.591
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 1.0,
3
  "eval_loss": Infinity,
4
- "eval_runtime": 10.8674,
5
  "eval_samples": 301,
6
- "eval_samples_per_second": 27.697,
7
- "eval_steps_per_second": 3.497,
8
  "eval_wer": 1.0
9
  }
 
1
  {
2
+ "epoch": 3.0,
3
  "eval_loss": Infinity,
4
+ "eval_runtime": 10.6149,
5
  "eval_samples": 301,
6
+ "eval_samples_per_second": 28.356,
7
+ "eval_steps_per_second": 3.58,
8
  "eval_wer": 1.0
9
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee4994b157fac9f1a49cc194ac61e2788cef6585a7610317e8349aea741d5a30
3
  size 1247823
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:941203e6a17701b67c1cafc3d6cb41d4cf74fc16cad3faa57ca84153d5da0cd2
3
  size 1247823
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "train_loss": 4.538612365722656,
4
- "train_runtime": 34.6,
5
  "train_samples": 704,
6
- "train_samples_per_second": 20.347,
7
- "train_steps_per_second": 2.543
8
  }
 
1
  {
2
+ "epoch": 3.0,
3
+ "train_loss": 3.7429571440725615,
4
+ "train_runtime": 101.8953,
5
  "train_samples": 704,
6
+ "train_samples_per_second": 20.727,
7
+ "train_steps_per_second": 2.591
8
  }
trainer_state.json CHANGED
@@ -1,25 +1,25 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0,
5
- "global_step": 88,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 1.0,
12
- "step": 88,
13
- "total_flos": 130613499224064.0,
14
- "train_loss": 4.538612365722656,
15
- "train_runtime": 34.6,
16
- "train_samples_per_second": 20.347,
17
- "train_steps_per_second": 2.543
18
  }
19
  ],
20
- "max_steps": 88,
21
- "num_train_epochs": 1,
22
- "total_flos": 130613499224064.0,
23
  "trial_name": null,
24
  "trial_params": null
25
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
+ "global_step": 264,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 3.0,
12
+ "step": 264,
13
+ "total_flos": 391664972335104.0,
14
+ "train_loss": 3.7429571440725615,
15
+ "train_runtime": 101.8953,
16
+ "train_samples_per_second": 20.727,
17
+ "train_steps_per_second": 2.591
18
  }
19
  ],
20
+ "max_steps": 264,
21
+ "num_train_epochs": 3,
22
+ "total_flos": 391664972335104.0,
23
  "trial_name": null,
24
  "trial_params": null
25
  }