m3hrdadfi committed on
Commit
942e89b
1 Parent(s): c3673ca

Hello hubert

Browse files
Files changed (5) hide show
  1. config.json +86 -0
  2. preprocessor_config.json +9 -0
  3. pytorch_model.bin +3 -0
  4. test.csv +122 -0
  5. trainer_state.json +85 -0
config.json ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/hubert-base-ls960",
3
+ "activation_dropout": 0.1,
4
+ "apply_spec_augment": true,
5
+ "architectures": [
6
+ "HubertForSpeechClassification"
7
+ ],
8
+ "attention_dropout": 0.1,
9
+ "bos_token_id": 1,
10
+ "conv_bias": false,
11
+ "conv_dim": [
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512
19
+ ],
20
+ "conv_kernel": [
21
+ 10,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 2,
27
+ 2
28
+ ],
29
+ "conv_stride": [
30
+ 5,
31
+ 2,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2
37
+ ],
38
+ "ctc_loss_reduction": "sum",
39
+ "ctc_zero_infinity": false,
40
+ "do_stable_layer_norm": false,
41
+ "eos_token_id": 2,
42
+ "feat_extract_activation": "gelu",
43
+ "feat_extract_dropout": 0.0,
44
+ "feat_extract_norm": "group",
45
+ "feat_proj_dropout": 0.1,
46
+ "final_dropout": 0.1,
47
+ "finetuning_task": "wav2vec2_clf",
48
+ "gradient_checkpointing": false,
49
+ "hidden_act": "gelu",
50
+ "hidden_dropout": 0.1,
51
+ "hidden_dropout_prob": 0.1,
52
+ "hidden_size": 768,
53
+ "id2label": {
54
+ "0": "anger",
55
+ "1": "disgust",
56
+ "2": "fear",
57
+ "3": "happiness",
58
+ "4": "sadness"
59
+ },
60
+ "initializer_range": 0.02,
61
+ "intermediate_size": 3072,
62
+ "label2id": {
63
+ "anger": 0,
64
+ "disgust": 1,
65
+ "fear": 2,
66
+ "happiness": 3,
67
+ "sadness": 4
68
+ },
69
+ "layer_norm_eps": 1e-05,
70
+ "layerdrop": 0.1,
71
+ "mask_feature_length": 10,
72
+ "mask_feature_prob": 0.0,
73
+ "mask_time_length": 10,
74
+ "mask_time_prob": 0.05,
75
+ "model_type": "hubert",
76
+ "num_attention_heads": 12,
77
+ "num_conv_pos_embedding_groups": 16,
78
+ "num_conv_pos_embeddings": 128,
79
+ "num_feat_extract_layers": 7,
80
+ "num_hidden_layers": 12,
81
+ "pad_token_id": 0,
82
+ "pooling_mode": "mean",
83
+ "problem_type": "single_label_classification",
84
+ "transformers_version": "4.7.0.dev0",
85
+ "vocab_size": 32
86
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "return_attention_mask": false,
8
+ "sampling_rate": 16000
9
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4f2ef3453ebf232bc8fc7929782dc57d94c5ae5fed93d7b3a1482c029da3e9c
3
+ size 379949267
test.csv ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name path emotion
2
+ d17 (2) /content/data/aesdd/disgust/d17 (2).wav disgust
3
+ s15 (2) /content/data/aesdd/sadness/s15 (2).wav sadness
4
+ a03 (2) /content/data/aesdd/anger/a03 (2).wav anger
5
+ s07 (5) /content/data/aesdd/sadness/s07 (5).wav sadness
6
+ h07 (2) /content/data/aesdd/happiness/h07 (2).wav happiness
7
+ f08 (4) /content/data/aesdd/fear/f08 (4).wav fear
8
+ f19 (1) /content/data/aesdd/fear/f19 (1).wav fear
9
+ s15 (4) /content/data/aesdd/sadness/s15 (4).wav sadness
10
+ f12 (5) /content/data/aesdd/fear/f12 (5).wav fear
11
+ s04 (6) /content/data/aesdd/sadness/s04 (6).wav sadness
12
+ a15 (4) /content/data/aesdd/anger/a15 (4).wav anger
13
+ h13 (5) /content/data/aesdd/happiness/h13 (5).wav happiness
14
+ d11 (6) /content/data/aesdd/disgust/d11 (6).wav disgust
15
+ a09 (6) /content/data/aesdd/anger/a09 (6).wav anger
16
+ h03 (1) /content/data/aesdd/happiness/h03 (1).wav happiness
17
+ s17 (6) /content/data/aesdd/sadness/s17 (6).wav sadness
18
+ d15 (5) /content/data/aesdd/disgust/d15 (5).wav disgust
19
+ s13 (4) /content/data/aesdd/sadness/s13 (4).wav sadness
20
+ f15 (3) /content/data/aesdd/fear/f15 (3).wav fear
21
+ h05 (3) /content/data/aesdd/happiness/h05 (3).wav happiness
22
+ s16 (4) /content/data/aesdd/sadness/s16 (4).wav sadness
23
+ f01 (6) /content/data/aesdd/fear/f01 (6).wav fear
24
+ d01 (1) /content/data/aesdd/disgust/d01 (1).wav disgust
25
+ d11 (5) /content/data/aesdd/disgust/d11 (5).wav disgust
26
+ a20 (3) /content/data/aesdd/anger/a20 (3).wav anger
27
+ a13 (5) /content/data/aesdd/anger/a13 (5).wav anger
28
+ a01 (2) /content/data/aesdd/anger/a01 (2).wav anger
29
+ f14 (4) /content/data/aesdd/fear/f14 (4).wav fear
30
+ a05 (3) /content/data/aesdd/anger/a05 (3).wav anger
31
+ h04 (5) /content/data/aesdd/happiness/h04 (5).wav happiness
32
+ h05 (4) /content/data/aesdd/happiness/h05 (4).wav happiness
33
+ f15 (4) /content/data/aesdd/fear/f15 (4).wav fear
34
+ h03 (3) /content/data/aesdd/happiness/h03 (3).wav happiness
35
+ f18 (4) /content/data/aesdd/fear/f18 (4).wav fear
36
+ f16 (3) /content/data/aesdd/fear/f16 (3).wav fear
37
+ d13 (5) /content/data/aesdd/disgust/d13 (5).wav disgust
38
+ a15 (2) /content/data/aesdd/anger/a15 (2).wav anger
39
+ a10 (6) /content/data/aesdd/anger/a10 (6).wav anger
40
+ a14 (1) /content/data/aesdd/anger/a14 (1).wav anger
41
+ d18 (1) /content/data/aesdd/disgust/d18 (1).wav disgust
42
+ f13 (01) /content/data/aesdd/fear/f13 (01).wav fear
43
+ h05 (1) /content/data/aesdd/happiness/h05 (1).wav happiness
44
+ h08 (4) /content/data/aesdd/happiness/h08 (4).wav happiness
45
+ f11 (01) /content/data/aesdd/fear/f11 (01).wav fear
46
+ s17 (5) /content/data/aesdd/sadness/s17 (5).wav sadness
47
+ d04 (2) /content/data/aesdd/disgust/d04 (2).wav disgust
48
+ d18 (4) /content/data/aesdd/disgust/d18 (4).wav disgust
49
+ h04 (6) /content/data/aesdd/happiness/h04 (6).wav happiness
50
+ s19 (1) /content/data/aesdd/sadness/s19 (1).wav sadness
51
+ a06 (5)b /content/data/aesdd/anger/a06 (5)b.wav anger
52
+ d14 (2) /content/data/aesdd/disgust/d14 (2).wav disgust
53
+ f09 (6) /content/data/aesdd/fear/f09 (6).wav fear
54
+ f17 (4) /content/data/aesdd/fear/f17 (4).wav fear
55
+ a06 (6) /content/data/aesdd/anger/a06 (6).wav anger
56
+ d08 (2) /content/data/aesdd/disgust/d08 (2).wav disgust
57
+ h07 (4) /content/data/aesdd/happiness/h07 (4).wav happiness
58
+ d09 (3) /content/data/aesdd/disgust/d09 (3).wav disgust
59
+ a12 (4) /content/data/aesdd/anger/a12 (4).wav anger
60
+ s07 (3) /content/data/aesdd/sadness/s07 (3).wav sadness
61
+ f16 (6) /content/data/aesdd/fear/f16 (6).wav fear
62
+ f13 (5) /content/data/aesdd/fear/f13 (5).wav fear
63
+ d17 (4) /content/data/aesdd/disgust/d17 (4).wav disgust
64
+ s07 (1) /content/data/aesdd/sadness/s07 (1).wav sadness
65
+ f02 (1) /content/data/aesdd/fear/f02 (1).wav fear
66
+ h10 (1) /content/data/aesdd/happiness/h10 (1).wav happiness
67
+ h10 (2) /content/data/aesdd/happiness/h10 (2).wav happiness
68
+ s04 (1) /content/data/aesdd/sadness/s04 (1).wav sadness
69
+ d10 (6) /content/data/aesdd/disgust/d10 (6).wav disgust
70
+ a04 (2) /content/data/aesdd/anger/a04 (2).wav anger
71
+ a18 (2) /content/data/aesdd/anger/a18 (2).wav anger
72
+ a18 (6) /content/data/aesdd/anger/a18 (6).wav anger
73
+ s12 (2) /content/data/aesdd/sadness/s12 (2).wav sadness
74
+ s15 (5) /content/data/aesdd/sadness/s15 (5).wav sadness
75
+ a08 (1) /content/data/aesdd/anger/a08 (1).wav anger
76
+ d02 (2) /content/data/aesdd/disgust/d02 (2).wav disgust
77
+ h12 (4) /content/data/aesdd/happiness/h12 (4).wav happiness
78
+ h08 (3) /content/data/aesdd/happiness/h08 (3).wav happiness
79
+ s10 (2) /content/data/aesdd/sadness/s10 (2).wav sadness
80
+ f19 (2) /content/data/aesdd/fear/f19 (2).wav fear
81
+ s10 (5) /content/data/aesdd/sadness/s10 (5).wav sadness
82
+ h09 (4) /content/data/aesdd/happiness/h09 (4).wav happiness
83
+ s13 (6) /content/data/aesdd/sadness/s13 (6).wav sadness
84
+ h18 (2) /content/data/aesdd/happiness/h18 (2).wav happiness
85
+ d03 (5) /content/data/aesdd/disgust/d03 (5).wav disgust
86
+ d14 (1) /content/data/aesdd/disgust/d14 (1).wav disgust
87
+ s02 (3) /content/data/aesdd/sadness/s02 (3).wav sadness
88
+ f14 (1) /content/data/aesdd/fear/f14 (1).wav fear
89
+ a01 (3) /content/data/aesdd/anger/a01 (3).wav anger
90
+ a07 (3) /content/data/aesdd/anger/a07 (3).wav anger
91
+ f17 (1) /content/data/aesdd/fear/f17 (1).wav fear
92
+ h14 (2) /content/data/aesdd/happiness/h14 (2).wav happiness
93
+ d01 (6) /content/data/aesdd/disgust/d01 (6).wav disgust
94
+ s01 (1) /content/data/aesdd/sadness/s01 (1).wav sadness
95
+ s17 (3) /content/data/aesdd/sadness/s17 (3).wav sadness
96
+ f15 (5) /content/data/aesdd/fear/f15 (5).wav fear
97
+ h01 (4) /content/data/aesdd/happiness/h01 (4).wav happiness
98
+ s09 (1) /content/data/aesdd/sadness/s09 (1).wav sadness
99
+ f06 (5) /content/data/aesdd/fear/f06 (5).wav fear
100
+ d05 (6) /content/data/aesdd/disgust/d05 (6).wav disgust
101
+ a08 (2) /content/data/aesdd/anger/a08 (2).wav anger
102
+ s13 (2) /content/data/aesdd/sadness/s13 (2).wav sadness
103
+ d18 (2) /content/data/aesdd/disgust/d18 (2).wav disgust
104
+ a09 (2) /content/data/aesdd/anger/a09 (2).wav anger
105
+ f05 (6) /content/data/aesdd/fear/f05 (6).wav fear
106
+ s04 (5) /content/data/aesdd/sadness/s04 (5).wav sadness
107
+ h06 (5) /content/data/aesdd/happiness/h06 (5).wav happiness
108
+ a14 (6) /content/data/aesdd/anger/a14 (6).wav anger
109
+ a13 (2) /content/data/aesdd/anger/a13 (2).wav anger
110
+ h10 (5) /content/data/aesdd/happiness/h10 (5).wav happiness
111
+ a13 (1) /content/data/aesdd/anger/a13 (1).wav anger
112
+ d12 (3) /content/data/aesdd/disgust/d12 (3).wav disgust
113
+ h18 (3) /content/data/aesdd/happiness/h18 (3).wav happiness
114
+ d15 (1) /content/data/aesdd/disgust/d15 (1).wav disgust
115
+ h19 (3) /content/data/aesdd/happiness/h19 (3).wav happiness
116
+ s05 (4) /content/data/aesdd/sadness/s05 (4).wav sadness
117
+ d17 (6) /content/data/aesdd/disgust/d17 (6).wav disgust
118
+ d12 (2) /content/data/aesdd/disgust/d12 (2).wav disgust
119
+ s06 (4) /content/data/aesdd/sadness/s06 (4).wav sadness
120
+ f19 (3) /content/data/aesdd/fear/f19 (3).wav fear
121
+ f09 (2) /content/data/aesdd/fear/f09 (2).wav fear
122
+ h08 (2) /content/data/aesdd/happiness/h08 (2).wav happiness
trainer_state.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 6.991735537190083,
5
+ "global_step": 420,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.66,
12
+ "learning_rate": 7.619047619047618e-05,
13
+ "loss": 1.2894,
14
+ "step": 100
15
+ },
16
+ {
17
+ "epoch": 1.66,
18
+ "eval_accuracy": 0.4958677589893341,
19
+ "eval_loss": 1.2452681064605713,
20
+ "eval_runtime": 7.5077,
21
+ "eval_samples_per_second": 16.117,
22
+ "eval_steps_per_second": 4.129,
23
+ "step": 100
24
+ },
25
+ {
26
+ "epoch": 3.33,
27
+ "learning_rate": 5.285714285714286e-05,
28
+ "loss": 0.7978,
29
+ "step": 200
30
+ },
31
+ {
32
+ "epoch": 3.33,
33
+ "eval_accuracy": 0.7768595218658447,
34
+ "eval_loss": 0.746031641960144,
35
+ "eval_runtime": 7.1743,
36
+ "eval_samples_per_second": 16.866,
37
+ "eval_steps_per_second": 4.321,
38
+ "step": 200
39
+ },
40
+ {
41
+ "epoch": 4.99,
42
+ "learning_rate": 2.9047619047619052e-05,
43
+ "loss": 0.4372,
44
+ "step": 300
45
+ },
46
+ {
47
+ "epoch": 4.99,
48
+ "eval_accuracy": 0.9008264541625977,
49
+ "eval_loss": 0.3735601603984833,
50
+ "eval_runtime": 7.2008,
51
+ "eval_samples_per_second": 16.804,
52
+ "eval_steps_per_second": 4.305,
53
+ "step": 300
54
+ },
55
+ {
56
+ "epoch": 6.66,
57
+ "learning_rate": 5.4761904761904765e-06,
58
+ "loss": 0.246,
59
+ "step": 400
60
+ },
61
+ {
62
+ "epoch": 6.66,
63
+ "eval_accuracy": 0.9504132270812988,
64
+ "eval_loss": 0.24308893084526062,
65
+ "eval_runtime": 10.0989,
66
+ "eval_samples_per_second": 11.982,
67
+ "eval_steps_per_second": 3.07,
68
+ "step": 400
69
+ },
70
+ {
71
+ "epoch": 6.99,
72
+ "step": 420,
73
+ "total_flos": 1.8354201823649805e+17,
74
+ "train_loss": 0.6664659727187384,
75
+ "train_runtime": 440.1582,
76
+ "train_samples_per_second": 7.681,
77
+ "train_steps_per_second": 0.954
78
+ }
79
+ ],
80
+ "max_steps": 420,
81
+ "num_train_epochs": 7,
82
+ "total_flos": 1.8354201823649805e+17,
83
+ "trial_name": null,
84
+ "trial_params": null
85
+ }