Ojro committed on
Commit
5eefe1f
1 Parent(s): 2324502

End of training

Browse files
README.md CHANGED
@@ -38,12 +38,12 @@ More information needed
38
  The following hyperparameters were used during training:
39
  - learning_rate: 1e-05
40
  - train_batch_size: 32
41
- - eval_batch_size: 32
42
  - seed: 42
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
- - lr_scheduler_type: constant_with_warmup
45
- - lr_scheduler_warmup_steps: 50
46
- - training_steps: 1
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
 
38
  The following hyperparameters were used during training:
39
  - learning_rate: 1e-05
40
  - train_batch_size: 32
41
+ - eval_batch_size: 16
42
  - seed: 42
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
+ - lr_scheduler_type: linear
45
+ - lr_scheduler_warmup_steps: 500
46
+ - training_steps: 3
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
config.json CHANGED
@@ -25,20 +25,7 @@
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 4,
27
  "eos_token_id": 50257,
28
- "forced_decoder_ids": [
29
- [
30
- 1,
31
- 50259
32
- ],
33
- [
34
- 2,
35
- 50359
36
- ],
37
- [
38
- 3,
39
- 50363
40
- ]
41
- ],
42
  "init_std": 0.02,
43
  "is_encoder_decoder": true,
44
  "mask_feature_length": 10,
@@ -56,99 +43,10 @@
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
59
- "suppress_tokens": [
60
- 1,
61
- 2,
62
- 7,
63
- 8,
64
- 9,
65
- 10,
66
- 14,
67
- 25,
68
- 26,
69
- 27,
70
- 28,
71
- 29,
72
- 31,
73
- 58,
74
- 59,
75
- 60,
76
- 61,
77
- 62,
78
- 63,
79
- 90,
80
- 91,
81
- 92,
82
- 93,
83
- 359,
84
- 503,
85
- 522,
86
- 542,
87
- 873,
88
- 893,
89
- 902,
90
- 918,
91
- 922,
92
- 931,
93
- 1350,
94
- 1853,
95
- 1982,
96
- 2460,
97
- 2627,
98
- 3246,
99
- 3253,
100
- 3268,
101
- 3536,
102
- 3846,
103
- 3961,
104
- 4183,
105
- 4667,
106
- 6585,
107
- 6647,
108
- 7273,
109
- 9061,
110
- 9383,
111
- 10428,
112
- 10929,
113
- 11938,
114
- 12033,
115
- 12331,
116
- 12562,
117
- 13793,
118
- 14157,
119
- 14635,
120
- 15265,
121
- 15618,
122
- 16553,
123
- 16604,
124
- 18362,
125
- 18956,
126
- 20075,
127
- 21675,
128
- 22520,
129
- 26130,
130
- 26161,
131
- 26435,
132
- 28279,
133
- 29464,
134
- 31650,
135
- 32302,
136
- 32470,
137
- 36865,
138
- 42863,
139
- 47425,
140
- 49870,
141
- 50254,
142
- 50258,
143
- 50358,
144
- 50359,
145
- 50360,
146
- 50361,
147
- 50362
148
- ],
149
  "torch_dtype": "float32",
150
  "transformers_version": "4.35.2",
151
- "use_cache": false,
152
  "use_weighted_layer_sum": false,
153
  "vocab_size": 51865
154
  }
 
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 4,
27
  "eos_token_id": 50257,
28
+ "forced_decoder_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  "init_std": 0.02,
30
  "is_encoder_decoder": true,
31
  "mask_feature_length": 10,
 
43
  "num_mel_bins": 80,
44
  "pad_token_id": 50257,
45
  "scale_embedding": false,
46
+ "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  "torch_dtype": "float32",
48
  "transformers_version": "4.35.2",
49
+ "use_cache": true,
50
  "use_weighted_layer_sum": false,
51
  "vocab_size": 51865
52
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:709f21504ce794231c93972d3b5f83ff3b78b75bdb3f0309f7e3f45d977f8489
3
  size 151061672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ea9d5b670a7f8f43e9d9c2038a4e26784a9b71188f8dcdfce63eb4f87b70c84
3
  size 151061672
runs/Nov27_11-13-54_icdcub-03/events.out.tfevents.1701083652.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abb70362dae1a5836a16fd1c4c05f5d2aa193407bae491e6b479eda76a5b61fc
3
+ size 9928
runs/Nov27_11-15-45_icdcub-03/events.out.tfevents.1701083747.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0bf24e8826464c5c5666c1eec8ba9a5d28a7791b3a714b2c34eb1906a8a7106
3
+ size 4984
runs/Nov27_11-17-02_icdcub-03/events.out.tfevents.1701083825.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd0f0353fd6544f8583f4689e5948c05a68270769a280fe622833872e8a9938c
3
+ size 4984
runs/Nov27_11-19-46_icdcub-03/events.out.tfevents.1701083988.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7065480b3b9959eac2c838067cc731acbe52d3c763aa1e0dae24befb2e30a888
3
+ size 4984
runs/Nov27_11-23-56_icdcub-03/events.out.tfevents.1701084238.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55631932587db6acf6b56c526b283fc21bf134f4f6ce25483d8e31d53333a0c1
3
+ size 4984
runs/Nov27_11-38-13_icdcub-03/events.out.tfevents.1701085095.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eaea35ec8e0b174d794d0d33efbcd32be6a063680b9b243654b5bbe5f34e3db
3
+ size 9928
runs/Nov27_12-01-04_icdcub-03/events.out.tfevents.1701086466.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99970e85c4afb787b7474c48106a2b858d8ceceabe6b17c0b6248a31c899497b
3
+ size 4984
runs/Nov27_12-06-08_icdcub-03/events.out.tfevents.1701086770.icdcub-03 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f5da58dc123b30f9f9492be7b25e83dd1fd4c18833ed93a70aba8e5a2aed434
3
+ size 5332
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f442d6a71b4265e615d0b6aeca32f9951b8fc8f39a153ef7804d63ba73c48d64
3
  size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbb5036d00f0361d3086e8a8a32b898c56ca0393e4123619dde7a205aae63347
3
  size 4283