KevinKibe committed on
Commit
c39408b
1 Parent(s): 343fb75

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -23,8 +23,8 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "q_proj",
27
- "v_proj"
28
  ],
29
  "task_type": null,
30
  "use_dora": false,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "v_proj",
27
+ "q_proj"
28
  ],
29
  "task_type": null,
30
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3817bdac47941aa18c809cca5ac9efbb6b46c4006fc14104768df724ee8242b
3
  size 62969640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c4bcc45e6a8da2ae160f9bd65758048abe4faf10b4343a1aedbe1bf55f148e2
3
  size 62969640
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9f618664b5498348481f486e1963fddf3dc94b99759ca6beed2f98fca4dee3e
3
  size 21304084
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d05d9fe8f5a25b04f4025ef8dfde06c9cb8706f062556efa4dddd6d869f62cb
3
  size 21304084
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f73514fbd7715a5444d57d8a29c96393312f999f2b3d122ec2a6d7e76ffb689d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:911c06249d601e638f8189d761307ccdbacc556cb7c9096b657158b80e91a9fb
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:691263e55c7bb34b6e090bd89cf079f362100d7bd758be475bd3e7091c1a4ed6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4849a6ac0a1d895740f1ab4eba9d346b8d898008d0cfe93dd108cd928d7c63e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,99 +1,35 @@
1
  {
2
- "best_metric": 72.41379310344827,
3
- "best_model_checkpoint": "../openai/whisper-large-v3-finetuned/checkpoint-20",
4
- "epoch": 7.09,
5
- "eval_steps": 20,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.07,
13
- "grad_norm": 1.2736600637435913,
14
  "learning_rate": 0.0001,
15
- "loss": 0.054,
16
- "step": 20
17
  },
18
  {
19
- "epoch": 1.07,
20
- "eval_loss": 2.1966075897216797,
21
- "eval_runtime": 68.9209,
22
- "eval_samples_per_second": 0.145,
23
- "eval_steps_per_second": 0.044,
24
- "eval_wer": 72.41379310344827,
25
- "step": 20
26
- },
27
- {
28
- "epoch": 3.01,
29
- "grad_norm": 0.4058435261249542,
30
- "learning_rate": 0.0001,
31
- "loss": 0.0226,
32
- "step": 40
33
- },
34
- {
35
- "epoch": 3.01,
36
- "eval_loss": 2.285231351852417,
37
- "eval_runtime": 69.6442,
38
- "eval_samples_per_second": 0.144,
39
- "eval_steps_per_second": 0.043,
40
- "eval_wer": 79.3103448275862,
41
- "step": 40
42
- },
43
- {
44
- "epoch": 4.08,
45
- "grad_norm": 0.26837655901908875,
46
- "learning_rate": 0.0001,
47
- "loss": 0.0124,
48
- "step": 60
49
- },
50
- {
51
- "epoch": 4.08,
52
- "eval_loss": 2.316169023513794,
53
- "eval_runtime": 217.2614,
54
- "eval_samples_per_second": 0.046,
55
- "eval_steps_per_second": 0.014,
56
- "eval_wer": 147.1264367816092,
57
- "step": 60
58
- },
59
- {
60
- "epoch": 6.02,
61
- "grad_norm": 0.08057563006877899,
62
- "learning_rate": 0.0001,
63
- "loss": 0.0061,
64
- "step": 80
65
- },
66
- {
67
- "epoch": 6.02,
68
- "eval_loss": 2.2900302410125732,
69
- "eval_runtime": 68.7884,
70
- "eval_samples_per_second": 0.145,
71
- "eval_steps_per_second": 0.044,
72
- "eval_wer": 74.71264367816092,
73
- "step": 80
74
- },
75
- {
76
- "epoch": 7.09,
77
- "grad_norm": 0.15883919596672058,
78
- "learning_rate": 0.0001,
79
- "loss": 0.0039,
80
- "step": 100
81
- },
82
- {
83
- "epoch": 7.09,
84
- "eval_loss": 2.3415772914886475,
85
- "eval_runtime": 216.593,
86
- "eval_samples_per_second": 0.046,
87
- "eval_steps_per_second": 0.014,
88
- "eval_wer": 141.3793103448276,
89
- "step": 100
90
  }
91
  ],
92
- "logging_steps": 20,
93
- "max_steps": 100,
94
  "num_input_tokens_seen": 0,
95
  "num_train_epochs": 9223372036854775807,
96
- "save_steps": 20,
97
  "stateful_callbacks": {
98
  "TrainerControl": {
99
  "args": {
@@ -101,13 +37,13 @@
101
  "should_evaluate": false,
102
  "should_log": false,
103
  "should_save": true,
104
- "should_training_stop": true
105
  },
106
  "attributes": {}
107
  }
108
  },
109
- "total_flos": 1.32542251794432e+18,
110
- "train_batch_size": 4,
111
  "trial_name": null,
112
  "trial_params": null
113
  }
 
1
  {
2
+ "best_metric": 31.16279069767442,
3
+ "best_model_checkpoint": "../openai/whisper-large-v3-finetuned/checkpoint-10",
4
+ "epoch": 3.033333333333333,
5
+ "eval_steps": 10,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 3.033333333333333,
13
+ "grad_norm": 1.5397560596466064,
14
  "learning_rate": 0.0001,
15
+ "loss": 3.2643,
16
+ "step": 10
17
  },
18
  {
19
+ "epoch": 3.033333333333333,
20
+ "eval_loss": 3.1313788890838623,
21
+ "eval_runtime": 127.0315,
22
+ "eval_samples_per_second": 0.157,
23
+ "eval_steps_per_second": 0.024,
24
+ "eval_wer": 31.16279069767442,
25
+ "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
+ "logging_steps": 10,
29
+ "max_steps": 30,
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 9223372036854775807,
32
+ "save_steps": 10,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
35
  "args": {
 
37
  "should_evaluate": false,
38
  "should_log": false,
39
  "should_save": true,
40
+ "should_training_stop": false
41
  },
42
  "attributes": {}
43
  }
44
  },
45
+ "total_flos": 2.3349412233216e+17,
46
+ "train_batch_size": 8,
47
  "trial_name": null,
48
  "trial_params": null
49
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d67fe5c97768c67bbca82cd2f92b09330635f100897633240c3099087275ae4
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73a2e914d430abee1d595139dd59f39cb44c03ff7a239558cb1fd89c77c3cef7
3
  size 5368