muratsimsek003 committed on
Commit
1ce5cae
1 Parent(s): b6f84e2

Training in progress, step 20

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "activation_dropout": 0.05,
3
  "adapter_attn_dim": 64,
4
  "adapter_kernel_size": 3,
5
  "adapter_stride": 2,
@@ -8,7 +8,7 @@
8
  "architectures": [
9
  "Wav2Vec2ForCTC"
10
  ],
11
- "attention_dropout": 0.05,
12
  "bos_token_id": 1,
13
  "classifier_proj_size": 256,
14
  "codevector_dim": 768,
@@ -49,23 +49,23 @@
49
  "feat_extract_activation": "gelu",
50
  "feat_extract_dropout": 0.0,
51
  "feat_extract_norm": "layer",
52
- "feat_proj_dropout": 0.05,
53
  "feat_quantizer_dropout": 0.0,
54
- "final_dropout": 0.05,
55
  "gradient_checkpointing": false,
56
  "hidden_act": "gelu",
57
- "hidden_dropout": 0.1,
58
  "hidden_size": 1024,
59
  "initializer_range": 0.02,
60
  "intermediate_size": 4096,
61
  "layer_norm_eps": 1e-05,
62
- "layerdrop": 0.1,
63
  "mask_feature_length": 10,
64
  "mask_feature_min_masks": 0,
65
- "mask_feature_prob": 0.05,
66
  "mask_time_length": 10,
67
  "mask_time_min_masks": 2,
68
- "mask_time_prob": 0.1,
69
  "model_type": "wav2vec2",
70
  "num_adapter_layers": 3,
71
  "num_attention_heads": 16,
 
1
  {
2
+ "activation_dropout": 0.0,
3
  "adapter_attn_dim": 64,
4
  "adapter_kernel_size": 3,
5
  "adapter_stride": 2,
 
8
  "architectures": [
9
  "Wav2Vec2ForCTC"
10
  ],
11
+ "attention_dropout": 0.0,
12
  "bos_token_id": 1,
13
  "classifier_proj_size": 256,
14
  "codevector_dim": 768,
 
49
  "feat_extract_activation": "gelu",
50
  "feat_extract_dropout": 0.0,
51
  "feat_extract_norm": "layer",
52
+ "feat_proj_dropout": 0.0,
53
  "feat_quantizer_dropout": 0.0,
54
+ "final_dropout": 0.0,
55
  "gradient_checkpointing": false,
56
  "hidden_act": "gelu",
57
+ "hidden_dropout": 0.0,
58
  "hidden_size": 1024,
59
  "initializer_range": 0.02,
60
  "intermediate_size": 4096,
61
  "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.0,
63
  "mask_feature_length": 10,
64
  "mask_feature_min_masks": 0,
65
+ "mask_feature_prob": 0.0,
66
  "mask_time_length": 10,
67
  "mask_time_min_masks": 2,
68
+ "mask_time_prob": 0.075,
69
  "model_type": "wav2vec2",
70
  "num_adapter_layers": 3,
71
  "num_attention_heads": 16,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58514a40e5f3eaff56bbbc2317efacc7037d831303a58bfd368a4fc2d5af529b
3
  size 1274889840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69b24ab30d7e68a19d91bf1153a7db14fbc99ca2ce42ae99b9e1ccc7770541ec
3
  size 1274889840
runs/Aug20_08-42-56_9aaae1e40cf3/events.out.tfevents.1724143531.9aaae1e40cf3.3167.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3272ab875aa600113f3f032668a825985a40f132177ccfcf003908a7db239261
3
+ size 6911
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:400fda15c81d0ae58221ce51ca3ccd1c78bcca629d39cfb50b8f0a786f1f03e0
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:658cabcb557e2c3b4e7ad5b6c21399142dd31da356e3d772aae87c8642b60946
3
  size 5240