crossdelenna committed on
Commit
f4ca35f
·
verified ·
1 Parent(s): 065e3ae

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. optimizer.pt +1 -1
  2. rng_state.pth +1 -1
  3. scheduler.pt +1 -1
  4. trainer_state.json +52 -36
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a782efdc728d114f90b12def8869d82a4bf4bb08077c7177e3d627cb2a10945
3
  size 693625338
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38a5fc0cf6ea40392dd62729ffdf797cefab021b41cd8c36fb187c0ae23a4d58
3
  size 693625338
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6d738b7a51be6af562af846720ffa1b521b2f642ec0a840cd45d5f4c9b24e16
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb6f255d22039016bd368cbeb9ec67a3324aba476af2ac6fa3c2b31955be7e84
3
  size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cd5fe0deafc847e744377630a02b485aaadcbf0c8a2ff89b7560cd716efb140
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46991dd2d014c7aba31aaaa97536010ff42c613f93552beac5e9b051ec0c9ebd
3
  size 1064
trainer_state.json CHANGED
@@ -1,51 +1,67 @@
1
  {
2
- "best_metric": 34.65030047308528,
3
- "best_model_checkpoint": "./whisper-medium.en/checkpoint-400",
4
- "epoch": 1.0335051546391754,
5
- "eval_steps": 200,
6
- "global_step": 401,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.5154639175257731,
13
- "grad_norm": 14.852355003356934,
14
- "learning_rate": 5.2685421994884914e-06,
15
- "loss": 2.2838,
16
- "step": 200
17
  },
18
  {
19
- "epoch": 0.5154639175257731,
20
- "eval_loss": 1.0020978450775146,
21
- "eval_runtime": 808.3907,
22
- "eval_samples_per_second": 1.277,
23
- "eval_steps_per_second": 0.16,
24
- "eval_wer": 36.01841196777906,
25
- "step": 200
26
  },
27
  {
28
- "epoch": 1.0309278350515463,
29
- "grad_norm": 8.327604293823242,
30
- "learning_rate": 1.534526854219949e-07,
31
- "loss": 0.9275,
32
- "step": 400
33
  },
34
  {
35
- "epoch": 1.0309278350515463,
36
- "eval_loss": 0.7616046071052551,
37
- "eval_runtime": 806.233,
38
- "eval_samples_per_second": 1.28,
39
- "eval_steps_per_second": 0.16,
40
- "eval_wer": 34.65030047308528,
41
- "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  }
43
  ],
44
- "logging_steps": 200,
45
- "max_steps": 401,
46
  "num_input_tokens_seen": 0,
47
- "num_train_epochs": 2,
48
- "save_steps": 200,
49
  "stateful_callbacks": {
50
  "TrainerControl": {
51
  "args": {
@@ -53,13 +69,13 @@
53
  "should_evaluate": false,
54
  "should_log": false,
55
  "should_save": true,
56
- "should_training_stop": true
57
  },
58
  "attributes": {}
59
  }
60
  },
61
- "total_flos": 6.53799503757312e+18,
62
- "train_batch_size": 16,
63
  "trial_name": null,
64
  "trial_params": null
65
  }
 
1
  {
2
+ "best_metric": 15.138377050364909,
3
+ "best_model_checkpoint": "./whisper-medium.en/checkpoint-1050",
4
+ "epoch": 3.723404255319149,
5
+ "eval_steps": 350,
6
+ "global_step": 1050,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 1.2411347517730495,
13
+ "grad_norm": 7.018165111541748,
14
+ "learning_rate": 6.753121998078771e-06,
15
+ "loss": 0.664,
16
+ "step": 350
17
  },
18
  {
19
+ "epoch": 1.2411347517730495,
20
+ "eval_loss": 0.399837464094162,
21
+ "eval_runtime": 733.8278,
22
+ "eval_samples_per_second": 1.406,
23
+ "eval_steps_per_second": 0.064,
24
+ "eval_wer": 18.209408194233685,
25
+ "step": 350
26
  },
27
  {
28
+ "epoch": 2.482269503546099,
29
+ "grad_norm": 4.022040367126465,
30
+ "learning_rate": 3.390970220941403e-06,
31
+ "loss": 0.4625,
32
+ "step": 700
33
  },
34
  {
35
+ "epoch": 2.482269503546099,
36
+ "eval_loss": 0.3244483172893524,
37
+ "eval_runtime": 737.4383,
38
+ "eval_samples_per_second": 1.399,
39
+ "eval_steps_per_second": 0.064,
40
+ "eval_wer": 16.06329937134186,
41
+ "step": 700
42
+ },
43
+ {
44
+ "epoch": 3.723404255319149,
45
+ "grad_norm": 4.158984661102295,
46
+ "learning_rate": 2.8818443804034583e-08,
47
+ "loss": 0.3703,
48
+ "step": 1050
49
+ },
50
+ {
51
+ "epoch": 3.723404255319149,
52
+ "eval_loss": 0.3033762276172638,
53
+ "eval_runtime": 728.0181,
54
+ "eval_samples_per_second": 1.418,
55
+ "eval_steps_per_second": 0.065,
56
+ "eval_wer": 15.138377050364909,
57
+ "step": 1050
58
  }
59
  ],
60
+ "logging_steps": 350,
61
+ "max_steps": 1051,
62
  "num_input_tokens_seen": 0,
63
+ "num_train_epochs": 4,
64
+ "save_steps": 350,
65
  "stateful_callbacks": {
66
  "TrainerControl": {
67
  "args": {
 
69
  "should_evaluate": false,
70
  "should_log": false,
71
  "should_save": true,
72
+ "should_training_stop": false
73
  },
74
  "attributes": {}
75
  }
76
  },
77
+ "total_flos": 2.355760247537664e+19,
78
+ "train_batch_size": 22,
79
  "trial_name": null,
80
  "trial_params": null
81
  }