m3hrdadfi commited on
Commit
3718460
1 Parent(s): 0122f97

Initial model

Browse files
added_tokens.json ADDED
@@ -0,0 +1 @@
 
1
+ {"<s>": 55, "</s>": 56}
all_results.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.99,
3
+ "eval_accuracy": 0.9090909361839294,
4
+ "eval_loss": 0.305728554725647,
5
+ "eval_mem_cpu_alloc_delta": 3919872,
6
+ "eval_mem_cpu_peaked_delta": 0,
7
+ "eval_mem_gpu_alloc_delta": 0,
8
+ "eval_mem_gpu_peaked_delta": 713997824,
9
+ "eval_runtime": 17.2794,
10
+ "eval_samples": 121,
11
+ "eval_samples_per_second": 7.003,
12
+ "init_mem_cpu_alloc_delta": 1225068544,
13
+ "init_mem_cpu_peaked_delta": 0,
14
+ "init_mem_gpu_alloc_delta": 1265974272,
15
+ "init_mem_gpu_peaked_delta": 0,
16
+ "total_flos": 2.907298151590248e+16,
17
+ "train_mem_cpu_alloc_delta": -1273180160,
18
+ "train_mem_cpu_peaked_delta": 1291272192,
19
+ "train_mem_gpu_alloc_delta": 3793395712,
20
+ "train_mem_gpu_peaked_delta": 1175817728,
21
+ "train_runtime": 1331.4211,
22
+ "train_samples": 483,
23
+ "train_samples_per_second": 0.315
24
+ }
config.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "lighteternal/wav2vec2-large-xlsr-53-greek",
3
+ "activation_dropout": 0.0,
4
+ "apply_spec_augment": true,
5
+ "architectures": [
6
+ "Wav2Vec2ForSpeechClassification"
7
+ ],
8
+ "attention_dropout": 0.1,
9
+ "bos_token_id": 1,
10
+ "conv_bias": true,
11
+ "conv_dim": [
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512
19
+ ],
20
+ "conv_kernel": [
21
+ 10,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 2,
27
+ 2
28
+ ],
29
+ "conv_stride": [
30
+ 5,
31
+ 2,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2
37
+ ],
38
+ "ctc_loss_reduction": "mean",
39
+ "ctc_zero_infinity": true,
40
+ "do_stable_layer_norm": true,
41
+ "eos_token_id": 2,
42
+ "feat_extract_activation": "gelu",
43
+ "feat_extract_dropout": 0.0,
44
+ "feat_extract_norm": "layer",
45
+ "feat_proj_dropout": 0.0,
46
+ "final_dropout": 0.0,
47
+ "finetuning_task": "wav2vec2_clf",
48
+ "gradient_checkpointing": true,
49
+ "hidden_act": "gelu",
50
+ "hidden_dropout": 0.1,
51
+ "hidden_size": 1024,
52
+ "id2label": {
53
+ "0": "anger",
54
+ "1": "disgust",
55
+ "2": "fear",
56
+ "3": "happiness",
57
+ "4": "sadness"
58
+ },
59
+ "initializer_range": 0.02,
60
+ "intermediate_size": 4096,
61
+ "label2id": {
62
+ "anger": 0,
63
+ "disgust": 1,
64
+ "fear": 2,
65
+ "happiness": 3,
66
+ "sadness": 4
67
+ },
68
+ "layer_norm_eps": 1e-05,
69
+ "layerdrop": 0.1,
70
+ "mask_channel_length": 10,
71
+ "mask_channel_min_space": 1,
72
+ "mask_channel_other": 0.0,
73
+ "mask_channel_prob": 0.0,
74
+ "mask_channel_selection": "static",
75
+ "mask_feature_length": 10,
76
+ "mask_feature_prob": 0.0,
77
+ "mask_time_length": 10,
78
+ "mask_time_min_space": 1,
79
+ "mask_time_other": 0.0,
80
+ "mask_time_prob": 0.05,
81
+ "mask_time_selection": "static",
82
+ "model_type": "wav2vec2",
83
+ "num_attention_heads": 16,
84
+ "num_conv_pos_embedding_groups": 16,
85
+ "num_conv_pos_embeddings": 128,
86
+ "num_feat_extract_layers": 7,
87
+ "num_hidden_layers": 24,
88
+ "pad_token_id": 54,
89
+ "pooling_mode": "mean",
90
+ "problem_type": "single_label_classification",
91
+ "transformers_version": "4.7.0.dev0",
92
+ "vocab_size": 55
93
+ }
eval_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.99,
3
+ "eval_accuracy": 0.9090909361839294,
4
+ "eval_loss": 0.305728554725647,
5
+ "eval_mem_cpu_alloc_delta": 3919872,
6
+ "eval_mem_cpu_peaked_delta": 0,
7
+ "eval_mem_gpu_alloc_delta": 0,
8
+ "eval_mem_gpu_peaked_delta": 713997824,
9
+ "eval_runtime": 17.2794,
10
+ "eval_samples": 121,
11
+ "eval_samples_per_second": 7.003
12
+ }
predict_results.txt ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ index prediction
2
+ 0 disgust
3
+ 1 sadness
4
+ 2 anger
5
+ 3 sadness
6
+ 4 happiness
7
+ 5 fear
8
+ 6 fear
9
+ 7 sadness
10
+ 8 fear
11
+ 9 sadness
12
+ 10 anger
13
+ 11 fear
14
+ 12 disgust
15
+ 13 anger
16
+ 14 happiness
17
+ 15 sadness
18
+ 16 disgust
19
+ 17 sadness
20
+ 18 fear
21
+ 19 happiness
22
+ 20 sadness
23
+ 21 fear
24
+ 22 disgust
25
+ 23 disgust
26
+ 24 anger
27
+ 25 anger
28
+ 26 anger
29
+ 27 fear
30
+ 28 anger
31
+ 29 happiness
32
+ 30 happiness
33
+ 31 fear
34
+ 32 happiness
35
+ 33 fear
36
+ 34 fear
37
+ 35 disgust
38
+ 36 anger
39
+ 37 anger
40
+ 38 anger
41
+ 39 disgust
42
+ 40 fear
43
+ 41 happiness
44
+ 42 happiness
45
+ 43 fear
46
+ 44 sadness
47
+ 45 disgust
48
+ 46 disgust
49
+ 47 disgust
50
+ 48 sadness
51
+ 49 anger
52
+ 50 disgust
53
+ 51 fear
54
+ 52 fear
55
+ 53 anger
56
+ 54 disgust
57
+ 55 disgust
58
+ 56 disgust
59
+ 57 anger
60
+ 58 sadness
61
+ 59 happiness
62
+ 60 fear
63
+ 61 disgust
64
+ 62 sadness
65
+ 63 fear
66
+ 64 happiness
67
+ 65 anger
68
+ 66 sadness
69
+ 67 disgust
70
+ 68 anger
71
+ 69 anger
72
+ 70 anger
73
+ 71 sadness
74
+ 72 sadness
75
+ 73 anger
76
+ 74 disgust
77
+ 75 happiness
78
+ 76 happiness
79
+ 77 sadness
80
+ 78 fear
81
+ 79 sadness
82
+ 80 happiness
83
+ 81 sadness
84
+ 82 happiness
85
+ 83 disgust
86
+ 84 disgust
87
+ 85 sadness
88
+ 86 fear
89
+ 87 anger
90
+ 88 anger
91
+ 89 fear
92
+ 90 happiness
93
+ 91 disgust
94
+ 92 sadness
95
+ 93 sadness
96
+ 94 fear
97
+ 95 fear
98
+ 96 sadness
99
+ 97 disgust
100
+ 98 disgust
101
+ 99 anger
102
+ 100 sadness
103
+ 101 disgust
104
+ 102 anger
105
+ 103 sadness
106
+ 104 sadness
107
+ 105 disgust
108
+ 106 anger
109
+ 107 anger
110
+ 108 happiness
111
+ 109 anger
112
+ 110 fear
113
+ 111 happiness
114
+ 112 disgust
115
+ 113 anger
116
+ 114 sadness
117
+ 115 disgust
118
+ 116 disgust
119
+ 117 sadness
120
+ 118 fear
121
+ 119 fear
122
+ 120 happiness
preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0.0,
7
+ "return_attention_mask": true,
8
+ "sampling_rate": 16000
9
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6b07c9d1149043e4a37682bf9a1443c7b53263ec3407dd55bf831d85fa7c29
3
+ size 1266153513
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
test.csv ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name path label
2
+ d01 (6) /content/data/aesdd/aesdd/disgust/d01 (6).wav disgust
3
+ s12 (5) /content/data/aesdd/aesdd/sadness/s12 (5).wav sadness
4
+ a07 (4) /content/data/aesdd/aesdd/anger/a07 (4).wav anger
5
+ s20 (4) /content/data/aesdd/aesdd/sadness/s20 (4).wav sadness
6
+ h13 (6) /content/data/aesdd/aesdd/happiness/h13 (6).wav happiness
7
+ f09 (6) /content/data/aesdd/aesdd/fear/f09 (6).wav fear
8
+ f19 (5) /content/data/aesdd/aesdd/fear/f19 (5).wav fear
9
+ s17 (4) /content/data/aesdd/aesdd/sadness/s17 (4).wav sadness
10
+ f20 (6) /content/data/aesdd/aesdd/fear/f20 (6).wav fear
11
+ s06 (6) /content/data/aesdd/aesdd/sadness/s06 (6).wav sadness
12
+ a04 (3) /content/data/aesdd/aesdd/anger/a04 (3).wav anger
13
+ h07 (3) /content/data/aesdd/aesdd/happiness/h07 (3).wav happiness
14
+ d02 (1) /content/data/aesdd/aesdd/disgust/d02 (1).wav disgust
15
+ a09 (4) /content/data/aesdd/aesdd/anger/a09 (4).wav anger
16
+ h01 (6) /content/data/aesdd/aesdd/happiness/h01 (6).wav happiness
17
+ s05 (2) /content/data/aesdd/aesdd/sadness/s05 (2).wav sadness
18
+ d12 (5) /content/data/aesdd/aesdd/disgust/d12 (5).wav disgust
19
+ s14 (4) /content/data/aesdd/aesdd/sadness/s14 (4).wav sadness
20
+ f16 (2) /content/data/aesdd/aesdd/fear/f16 (2).wav fear
21
+ h14 (5) /content/data/aesdd/aesdd/happiness/h14 (5).wav happiness
22
+ s09 (4) /content/data/aesdd/aesdd/sadness/s09 (4).wav sadness
23
+ f04 (3) /content/data/aesdd/aesdd/fear/f04 (3).wav fear
24
+ d01 (4) /content/data/aesdd/aesdd/disgust/d01 (4).wav disgust
25
+ d03 (3) /content/data/aesdd/aesdd/disgust/d03 (3).wav disgust
26
+ a10 (1) /content/data/aesdd/aesdd/anger/a10 (1).wav anger
27
+ a11 (2) /content/data/aesdd/aesdd/anger/a11 (2).wav anger
28
+ a11 (5) /content/data/aesdd/aesdd/anger/a11 (5).wav anger
29
+ f15 (2) /content/data/aesdd/aesdd/fear/f15 (2).wav fear
30
+ a03 (6) /content/data/aesdd/aesdd/anger/a03 (6).wav anger
31
+ h13 (1) /content/data/aesdd/aesdd/happiness/h13 (1).wav happiness
32
+ h05 (4) /content/data/aesdd/aesdd/happiness/h05 (4).wav happiness
33
+ f10 (3) /content/data/aesdd/aesdd/fear/f10 (3).wav fear
34
+ h17 (1) /content/data/aesdd/aesdd/happiness/h17 (1).wav happiness
35
+ f18 (2) /content/data/aesdd/aesdd/fear/f18 (2).wav fear
36
+ f05 (2) /content/data/aesdd/aesdd/fear/f05 (2).wav fear
37
+ d09 (2) /content/data/aesdd/aesdd/disgust/d09 (2).wav disgust
38
+ a08 (1) /content/data/aesdd/aesdd/anger/a08 (1).wav anger
39
+ a17 (3) /content/data/aesdd/aesdd/anger/a17 (3).wav anger
40
+ a02 (6) /content/data/aesdd/aesdd/anger/a02 (6).wav anger
41
+ d11 (6) /content/data/aesdd/aesdd/disgust/d11 (6).wav disgust
42
+ f17 (5) /content/data/aesdd/aesdd/fear/f17 (5).wav fear
43
+ h08 (2) /content/data/aesdd/aesdd/happiness/h08 (2).wav happiness
44
+ h01 (1) /content/data/aesdd/aesdd/happiness/h01 (1).wav happiness
45
+ f18 (5)b /content/data/aesdd/aesdd/fear/f18 (5)b.wav fear
46
+ s03 (2) /content/data/aesdd/aesdd/sadness/s03 (2).wav sadness
47
+ d14 (1) /content/data/aesdd/aesdd/disgust/d14 (1).wav disgust
48
+ d17 (3) /content/data/aesdd/aesdd/disgust/d17 (3).wav disgust
49
+ h16 (6) /content/data/aesdd/aesdd/happiness/h16 (6).wav happiness
50
+ s07 (3) /content/data/aesdd/aesdd/sadness/s07 (3).wav sadness
51
+ a06 (3) /content/data/aesdd/aesdd/anger/a06 (3).wav anger
52
+ d13 (5) /content/data/aesdd/aesdd/disgust/d13 (5).wav disgust
53
+ f12 (6) /content/data/aesdd/aesdd/fear/f12 (6).wav fear
54
+ f04 (6) /content/data/aesdd/aesdd/fear/f04 (6).wav fear
55
+ a10 (4) /content/data/aesdd/aesdd/anger/a10 (4).wav anger
56
+ d09 (1) /content/data/aesdd/aesdd/disgust/d09 (1).wav disgust
57
+ h20 (1) /content/data/aesdd/aesdd/happiness/h20 (1).wav happiness
58
+ d02 (3) /content/data/aesdd/aesdd/disgust/d02 (3).wav disgust
59
+ a05 (5) /content/data/aesdd/aesdd/anger/a05 (5).wav anger
60
+ s02 (1) /content/data/aesdd/aesdd/sadness/s02 (1).wav sadness
61
+ f04 (2) /content/data/aesdd/aesdd/fear/f04 (2).wav fear
62
+ f06 (2) /content/data/aesdd/aesdd/fear/f06 (2).wav fear
63
+ d20 (6) /content/data/aesdd/aesdd/disgust/d20 (6).wav disgust
64
+ s11 (4) /content/data/aesdd/aesdd/sadness/s11 (4).wav sadness
65
+ f08 (6) /content/data/aesdd/aesdd/fear/f08 (6).wav fear
66
+ h11 (5) /content/data/aesdd/aesdd/happiness/h11 (5).wav happiness
67
+ h18 (4) /content/data/aesdd/aesdd/happiness/h18 (4).wav happiness
68
+ s02 (4) /content/data/aesdd/aesdd/sadness/s02 (4).wav sadness
69
+ d20 (3) /content/data/aesdd/aesdd/disgust/d20 (3).wav disgust
70
+ a13 (2) /content/data/aesdd/aesdd/anger/a13 (2).wav anger
71
+ a18 (2) /content/data/aesdd/aesdd/anger/a18 (2).wav anger
72
+ a11 (4) /content/data/aesdd/aesdd/anger/a11 (4).wav anger
73
+ s09 (1) /content/data/aesdd/aesdd/sadness/s09 (1).wav sadness
74
+ s09 (6) /content/data/aesdd/aesdd/sadness/s09 (6).wav sadness
75
+ a19 (5) /content/data/aesdd/aesdd/anger/a19 (5).wav anger
76
+ d10 (5) /content/data/aesdd/aesdd/disgust/d10 (5).wav disgust
77
+ h05 (3) /content/data/aesdd/aesdd/happiness/h05 (3).wav happiness
78
+ h06 (6) /content/data/aesdd/aesdd/happiness/h06 (6).wav happiness
79
+ s04 (5) /content/data/aesdd/aesdd/sadness/s04 (5).wav sadness
80
+ f16 (6) /content/data/aesdd/aesdd/fear/f16 (6).wav fear
81
+ s16 (5) /content/data/aesdd/aesdd/sadness/s16 (5).wav sadness
82
+ h10 (4) /content/data/aesdd/aesdd/happiness/h10 (4).wav happiness
83
+ s01 (4) /content/data/aesdd/aesdd/sadness/s01 (4).wav sadness
84
+ h02 (1) /content/data/aesdd/aesdd/happiness/h02 (1).wav happiness
85
+ d16 (6) /content/data/aesdd/aesdd/disgust/d16 (6).wav disgust
86
+ d01 (5)b /content/data/aesdd/aesdd/disgust/d01 (5)b.wav disgust
87
+ s06 (4) /content/data/aesdd/aesdd/sadness/s06 (4).wav sadness
88
+ f20 (3) /content/data/aesdd/aesdd/fear/f20 (3).wav fear
89
+ a14 (2) /content/data/aesdd/aesdd/anger/a14 (2).wav anger
90
+ a12 (1) /content/data/aesdd/aesdd/anger/a12 (1).wav anger
91
+ f11 (4) /content/data/aesdd/aesdd/fear/f11 (4).wav fear
92
+ h07 (4) /content/data/aesdd/aesdd/happiness/h07 (4).wav happiness
93
+ d13 (3) /content/data/aesdd/aesdd/disgust/d13 (3).wav disgust
94
+ s07 (5) /content/data/aesdd/aesdd/sadness/s07 (5).wav sadness
95
+ s17 (5) /content/data/aesdd/aesdd/sadness/s17 (5).wav sadness
96
+ f11 (3) /content/data/aesdd/aesdd/fear/f11 (3).wav fear
97
+ h04 (2) /content/data/aesdd/aesdd/happiness/h04 (2).wav happiness
98
+ s02 (3) /content/data/aesdd/aesdd/sadness/s02 (3).wav sadness
99
+ f08 (5) /content/data/aesdd/aesdd/fear/f08 (5).wav fear
100
+ d01 (3) /content/data/aesdd/aesdd/disgust/d01 (3).wav disgust
101
+ a14 (5) /content/data/aesdd/aesdd/anger/a14 (5).wav anger
102
+ s03 (4) /content/data/aesdd/aesdd/sadness/s03 (4).wav sadness
103
+ d07 (2) /content/data/aesdd/aesdd/disgust/d07 (2).wav disgust
104
+ a14 (4) /content/data/aesdd/aesdd/anger/a14 (4).wav anger
105
+ f20 (2) /content/data/aesdd/aesdd/fear/f20 (2).wav fear
106
+ s17 (1) /content/data/aesdd/aesdd/sadness/s17 (1).wav sadness
107
+ h04 (1) /content/data/aesdd/aesdd/happiness/h04 (1).wav happiness
108
+ a17 (5) /content/data/aesdd/aesdd/anger/a17 (5).wav anger
109
+ a03 (1) /content/data/aesdd/aesdd/anger/a03 (1).wav anger
110
+ h16 (2) /content/data/aesdd/aesdd/happiness/h16 (2).wav happiness
111
+ a18 (3) /content/data/aesdd/aesdd/anger/a18 (3).wav anger
112
+ d07 (1) /content/data/aesdd/aesdd/disgust/d07 (1).wav disgust
113
+ h13 (4) /content/data/aesdd/aesdd/happiness/h13 (4).wav happiness
114
+ d05 (2) /content/data/aesdd/aesdd/disgust/d05 (2).wav disgust
115
+ h19 (2) /content/data/aesdd/aesdd/happiness/h19 (2).wav happiness
116
+ s10 (4) /content/data/aesdd/aesdd/sadness/s10 (4).wav sadness
117
+ d02 (6) /content/data/aesdd/aesdd/disgust/d02 (6).wav disgust
118
+ d07 (5) /content/data/aesdd/aesdd/disgust/d07 (5).wav disgust
119
+ s03 (6) /content/data/aesdd/aesdd/sadness/s03 (6).wav sadness
120
+ f12 (01) /content/data/aesdd/aesdd/fear/f12 (01).wav fear
121
+ f18 (4) /content/data/aesdd/aesdd/fear/f18 (4).wav fear
122
+ h06 (2) /content/data/aesdd/aesdd/happiness/h06 (2).wav happiness
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"unk_token": "[UNK]", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "[PAD]", "do_lower_case": false, "word_delimiter_token": "|", "special_tokens_map_file": "/content/cache/7583eec6f0fc5d29c5d19e109f1737ce0da6c2c4c27426590e235ea7a79499f8.a21d51735cf8667bcd610f057e88548d5d6a381401f6b4501a8bc6c1a9dc8498", "tokenizer_file": null, "name_or_path": "lighteternal/wav2vec2-large-xlsr-53-greek"}
train_results.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.99,
3
+ "init_mem_cpu_alloc_delta": 1225068544,
4
+ "init_mem_cpu_peaked_delta": 0,
5
+ "init_mem_gpu_alloc_delta": 1265974272,
6
+ "init_mem_gpu_peaked_delta": 0,
7
+ "total_flos": 2.907298151590248e+16,
8
+ "train_mem_cpu_alloc_delta": -1273180160,
9
+ "train_mem_cpu_peaked_delta": 1291272192,
10
+ "train_mem_gpu_alloc_delta": 3793395712,
11
+ "train_mem_gpu_peaked_delta": 1175817728,
12
+ "train_runtime": 1331.4211,
13
+ "train_samples": 483,
14
+ "train_samples_per_second": 0.315
15
+ }
trainer_state.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 6.991735537190083,
5
+ "global_step": 420,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.66,
12
+ "learning_rate": 7.642857142857143e-05,
13
+ "loss": 1.3365,
14
+ "step": 100
15
+ },
16
+ {
17
+ "epoch": 1.66,
18
+ "eval_accuracy": 0.6363636255264282,
19
+ "eval_loss": 0.8412261605262756,
20
+ "eval_runtime": 17.1267,
21
+ "eval_samples_per_second": 7.065,
22
+ "step": 100
23
+ },
24
+ {
25
+ "epoch": 3.33,
26
+ "learning_rate": 5.285714285714286e-05,
27
+ "loss": 0.6421,
28
+ "step": 200
29
+ },
30
+ {
31
+ "epoch": 3.33,
32
+ "eval_accuracy": 0.8677685856819153,
33
+ "eval_loss": 0.4234764575958252,
34
+ "eval_runtime": 17.292,
35
+ "eval_samples_per_second": 6.997,
36
+ "step": 200
37
+ },
38
+ {
39
+ "epoch": 4.99,
40
+ "learning_rate": 2.9047619047619052e-05,
41
+ "loss": 0.3537,
42
+ "step": 300
43
+ },
44
+ {
45
+ "epoch": 4.99,
46
+ "eval_accuracy": 0.8429751992225647,
47
+ "eval_loss": 0.518673300743103,
48
+ "eval_runtime": 17.2657,
49
+ "eval_samples_per_second": 7.008,
50
+ "step": 300
51
+ },
52
+ {
53
+ "epoch": 6.66,
54
+ "learning_rate": 5.2380952380952384e-06,
55
+ "loss": 0.1469,
56
+ "step": 400
57
+ },
58
+ {
59
+ "epoch": 6.66,
60
+ "eval_accuracy": 0.9090909361839294,
61
+ "eval_loss": 0.3046664297580719,
62
+ "eval_runtime": 17.2878,
63
+ "eval_samples_per_second": 6.999,
64
+ "step": 400
65
+ },
66
+ {
67
+ "epoch": 6.99,
68
+ "step": 420,
69
+ "total_flos": 2.907298151590248e+16,
70
+ "train_runtime": 1331.4211,
71
+ "train_samples_per_second": 0.315
72
+ }
73
+ ],
74
+ "max_steps": 420,
75
+ "num_train_epochs": 7,
76
+ "total_flos": 2.907298151590248e+16,
77
+ "trial_name": null,
78
+ "trial_params": null
79
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80c58b17f666adf92166966fd5a7b22476ec660730d80d3b2609b416b7e64e57
3
+ size 2415
vocab.json ADDED
@@ -0,0 +1 @@
 
1
+ {"ψ": 0, "ρ": 1, "φ": 2, "π": 3, "m": 4, "ο": 5, "t": 6, "ϋ": 7, "σ": 8, "ϊ": 9, "g": 10, "´": 11, "e": 12, "ύ": 13, "ΐ": 14, "’": 15, "a": 16, "τ": 17, "δ": 18, "ζ": 19, "r": 20, "λ": 21, "θ": 22, "·": 23, "»": 24, "«": 25, "β": 26, "κ": 27, "ν": 28, "n": 29, "χ": 31, "η": 32, "γ": 33, "ά": 34, "ω": 35, "έ": 36, "ό": 37, "μ": 38, "ς": 39, "o": 40, "ξ": 41, "ή": 42, "ώ": 43, "ε": 44, "ι": 45, "h": 46, "α": 47, "ί": 48, "'": 49, "v": 50, "υ": 51, "́": 52, "|": 30, "[UNK]": 53, "[PAD]": 54}