tensorboy committed on
Commit
70b864f
1 Parent(s): 24130d4

Model save

Browse files
README.md CHANGED
@@ -1,6 +1,4 @@
1
  ---
2
- license: apache-2.0
3
- base_model: openai/whisper-tiny
4
  tags:
5
  - generated_from_trainer
6
  metrics:
@@ -15,10 +13,10 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # whisper-tiny-hi2_test
17
 
18
- This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the None dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.5557
21
- - Wer: 60.5843
22
 
23
  ## Model description
24
 
 
1
  ---
 
 
2
  tags:
3
  - generated_from_trainer
4
  metrics:
 
13
 
14
  # whisper-tiny-hi2_test
15
 
16
+ This model was trained from scratch on the None dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Loss: 0.4940
19
+ - Wer: 59.7206
20
 
21
  ## Model description
22
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-tiny",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
1
  {
2
+ "_name_or_path": "./whisper-tiny-hi2_test/whisper-tiny-hi-checkpoint-1",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
runs/Jun26_08-55-05_bharatsahaiyak-test/events.out.tfevents.1719392105.bharatsahaiyak-test.1215638.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:165d0582673ef188b9d52b9c14d1a45c51671773f3298a7eb630d6fb6f82e50a
3
+ size 6048
runs/Jun26_08-55-05_bharatsahaiyak-test/events.out.tfevents.1719392419.bharatsahaiyak-test.1215638.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:778b4630a2197cb19c0539dab2ab6c6ebbfe08a5a766bb35019cf7a58d314172
3
+ size 406
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3a2d63b5e8da641a253ed23f58db5d3da9941bebd2a70aef95105c81a4fa484
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9287bb38beb16bf58664c3ed10f735c1bd05dd62bb178cf34a56cf97c52b277
3
  size 5240
whisper-tiny-hi-checkpoint-1/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 58.31498729889923,
3
- "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-80",
4
- "epoch": 6.25,
5
  "eval_steps": 40,
6
  "global_step": 200,
7
  "is_hyper_param_search": false,
@@ -9,128 +9,128 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.625,
13
- "grad_norm": 8.544885635375977,
14
  "learning_rate": 3.75e-05,
15
- "loss": 1.8228,
16
  "step": 20
17
  },
18
  {
19
- "epoch": 1.25,
20
- "grad_norm": 6.32118558883667,
21
  "learning_rate": 3.75e-05,
22
- "loss": 0.6803,
23
  "step": 40
24
  },
25
  {
26
- "epoch": 1.25,
27
- "eval_loss": 0.6102083325386047,
28
- "eval_runtime": 542.5987,
29
- "eval_samples_per_second": 1.843,
30
- "eval_steps_per_second": 1.843,
31
- "eval_wer": 65.94411515664692,
32
  "step": 40
33
  },
34
  {
35
- "epoch": 1.875,
36
- "grad_norm": 6.4600510597229,
37
  "learning_rate": 3.75e-05,
38
- "loss": 0.4966,
39
  "step": 60
40
  },
41
  {
42
- "epoch": 2.5,
43
- "grad_norm": 5.194849491119385,
44
  "learning_rate": 3.75e-05,
45
- "loss": 0.3649,
46
  "step": 80
47
  },
48
  {
49
- "epoch": 2.5,
50
- "eval_loss": 0.5036975741386414,
51
- "eval_runtime": 540.6408,
52
- "eval_samples_per_second": 1.85,
53
- "eval_steps_per_second": 1.85,
54
- "eval_wer": 58.31498729889923,
55
  "step": 80
56
  },
57
  {
58
- "epoch": 3.125,
59
- "grad_norm": 4.111001014709473,
60
  "learning_rate": 3.75e-05,
61
- "loss": 0.3075,
62
  "step": 100
63
  },
64
  {
65
- "epoch": 3.75,
66
- "grad_norm": 4.358007431030273,
67
  "learning_rate": 3.75e-05,
68
- "loss": 0.2296,
69
  "step": 120
70
  },
71
  {
72
- "epoch": 3.75,
73
- "eval_loss": 0.48966631293296814,
74
- "eval_runtime": 538.04,
75
- "eval_samples_per_second": 1.859,
76
- "eval_steps_per_second": 1.859,
77
- "eval_wer": 66.71464860287891,
78
  "step": 120
79
  },
80
  {
81
- "epoch": 4.375,
82
- "grad_norm": 4.111566066741943,
83
  "learning_rate": 3.75e-05,
84
- "loss": 0.1811,
85
  "step": 140
86
  },
87
  {
88
- "epoch": 5.0,
89
- "grad_norm": 6.702174186706543,
90
  "learning_rate": 3.75e-05,
91
- "loss": 0.1564,
92
  "step": 160
93
  },
94
  {
95
- "epoch": 5.0,
96
- "eval_loss": 0.5130774974822998,
97
- "eval_runtime": 529.7879,
98
- "eval_samples_per_second": 1.888,
99
- "eval_steps_per_second": 1.888,
100
- "eval_wer": 65.34292972057578,
101
  "step": 160
102
  },
103
  {
104
- "epoch": 5.625,
105
- "grad_norm": 3.0882856845855713,
106
  "learning_rate": 3.75e-05,
107
- "loss": 0.101,
108
  "step": 180
109
  },
110
  {
111
- "epoch": 6.25,
112
- "grad_norm": 4.524318695068359,
113
  "learning_rate": 3.75e-05,
114
- "loss": 0.0905,
115
  "step": 200
116
  },
117
  {
118
- "epoch": 6.25,
119
- "eval_loss": 0.5503659248352051,
120
- "eval_runtime": 587.5545,
121
- "eval_samples_per_second": 1.702,
122
- "eval_steps_per_second": 1.702,
123
- "eval_wer": 63.903471634208294,
124
  "step": 200
125
  },
126
  {
127
- "epoch": 6.25,
128
  "step": 200,
129
- "total_flos": 1.5401574531072e+17,
130
- "train_loss": 0.44307032763957976,
131
- "train_runtime": 3561.8571,
132
- "train_samples_per_second": 1.797,
133
- "train_steps_per_second": 0.056
134
  }
135
  ],
136
  "logging_steps": 20,
@@ -150,8 +150,8 @@
150
  "attributes": {}
151
  }
152
  },
153
- "total_flos": 1.5401574531072e+17,
154
- "train_batch_size": 32,
155
  "trial_name": null,
156
  "trial_params": null
157
  }
 
1
  {
2
+ "best_metric": 59.720575783234544,
3
+ "best_model_checkpoint": "./whisper-tiny-hi2_test/checkpoint-120",
4
+ "epoch": 6.349206349206349,
5
  "eval_steps": 40,
6
  "global_step": 200,
7
  "is_hyper_param_search": false,
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.6349206349206349,
13
+ "grad_norm": 8.253315925598145,
14
  "learning_rate": 3.75e-05,
15
+ "loss": 1.7555,
16
  "step": 20
17
  },
18
  {
19
+ "epoch": 1.2698412698412698,
20
+ "grad_norm": 6.022846698760986,
21
  "learning_rate": 3.75e-05,
22
+ "loss": 0.6766,
23
  "step": 40
24
  },
25
  {
26
+ "epoch": 1.2698412698412698,
27
+ "eval_loss": 0.6153799295425415,
28
+ "eval_runtime": 368.3001,
29
+ "eval_samples_per_second": 2.715,
30
+ "eval_steps_per_second": 0.679,
31
+ "eval_wer": 81.47332768839966,
32
  "step": 40
33
  },
34
  {
35
+ "epoch": 1.9047619047619047,
36
+ "grad_norm": 6.249065399169922,
37
  "learning_rate": 3.75e-05,
38
+ "loss": 0.4907,
39
  "step": 60
40
  },
41
  {
42
+ "epoch": 2.5396825396825395,
43
+ "grad_norm": 5.881297588348389,
44
  "learning_rate": 3.75e-05,
45
+ "loss": 0.3599,
46
  "step": 80
47
  },
48
  {
49
+ "epoch": 2.5396825396825395,
50
+ "eval_loss": 0.5078147649765015,
51
+ "eval_runtime": 314.278,
52
+ "eval_samples_per_second": 3.182,
53
+ "eval_steps_per_second": 0.795,
54
+ "eval_wer": 67.01100762066045,
55
  "step": 80
56
  },
57
  {
58
+ "epoch": 3.1746031746031744,
59
+ "grad_norm": 4.2090606689453125,
60
  "learning_rate": 3.75e-05,
61
+ "loss": 0.301,
62
  "step": 100
63
  },
64
  {
65
+ "epoch": 3.8095238095238093,
66
+ "grad_norm": 4.868574142456055,
67
  "learning_rate": 3.75e-05,
68
+ "loss": 0.2297,
69
  "step": 120
70
  },
71
  {
72
+ "epoch": 3.8095238095238093,
73
+ "eval_loss": 0.49397116899490356,
74
+ "eval_runtime": 304.836,
75
+ "eval_samples_per_second": 3.28,
76
+ "eval_steps_per_second": 0.82,
77
+ "eval_wer": 59.720575783234544,
78
  "step": 120
79
  },
80
  {
81
+ "epoch": 4.444444444444445,
82
+ "grad_norm": 4.324865341186523,
83
  "learning_rate": 3.75e-05,
84
+ "loss": 0.1754,
85
  "step": 140
86
  },
87
  {
88
+ "epoch": 5.079365079365079,
89
+ "grad_norm": 3.0074007511138916,
90
  "learning_rate": 3.75e-05,
91
+ "loss": 0.153,
92
  "step": 160
93
  },
94
  {
95
+ "epoch": 5.079365079365079,
96
+ "eval_loss": 0.5192885994911194,
97
+ "eval_runtime": 309.7886,
98
+ "eval_samples_per_second": 3.228,
99
+ "eval_steps_per_second": 0.807,
100
+ "eval_wer": 62.07451312447078,
101
  "step": 160
102
  },
103
  {
104
+ "epoch": 5.714285714285714,
105
+ "grad_norm": 2.9954638481140137,
106
  "learning_rate": 3.75e-05,
107
+ "loss": 0.1049,
108
  "step": 180
109
  },
110
  {
111
+ "epoch": 6.349206349206349,
112
+ "grad_norm": 3.4090383052825928,
113
  "learning_rate": 3.75e-05,
114
+ "loss": 0.0885,
115
  "step": 200
116
  },
117
  {
118
+ "epoch": 6.349206349206349,
119
+ "eval_loss": 0.5557394027709961,
120
+ "eval_runtime": 308.2851,
121
+ "eval_samples_per_second": 3.244,
122
+ "eval_steps_per_second": 0.811,
123
+ "eval_wer": 60.584250635055035,
124
  "step": 200
125
  },
126
  {
127
+ "epoch": 6.349206349206349,
128
  "step": 200,
129
+ "total_flos": 1.5637915828224e+17,
130
+ "train_loss": 0.4335097998380661,
131
+ "train_runtime": 2402.3095,
132
+ "train_samples_per_second": 2.664,
133
+ "train_steps_per_second": 0.083
134
  }
135
  ],
136
  "logging_steps": 20,
 
150
  "attributes": {}
151
  }
152
  },
153
+ "total_flos": 1.5637915828224e+17,
154
+ "train_batch_size": 16,
155
  "trial_name": null,
156
  "trial_params": null
157
  }
whisper-tiny-hi-checkpoint-2/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:802a25ee7db91faba0d8c4d8ea560053183efcadf455712cb855292076f680e4
3
+ size 151099494
whisper-tiny-hi-checkpoint-2/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:549ce3613e0053502a77050b29a76987037c7c15586538493db5d847eb76fe1c
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9287bb38beb16bf58664c3ed10f735c1bd05dd62bb178cf34a56cf97c52b277
3
  size 5240