Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +16 -10
- checkpoint-170/config.json +0 -4
- checkpoint-170/model.safetensors +1 -1
- checkpoint-170/optimizer.pt +1 -1
- checkpoint-170/scheduler.pt +1 -1
- checkpoint-170/trainer_state.json +20 -20
- checkpoint-170/training_args.bin +1 -1
- checkpoint-256/config.json +0 -4
- checkpoint-256/model.safetensors +1 -1
- checkpoint-256/optimizer.pt +1 -1
- checkpoint-256/scheduler.pt +1 -1
- checkpoint-256/trainer_state.json +28 -28
- checkpoint-256/training_args.bin +1 -1
- checkpoint-341/config.json +0 -4
- checkpoint-341/model.safetensors +1 -1
- checkpoint-341/optimizer.pt +1 -1
- checkpoint-341/trainer_state.json +32 -32
- checkpoint-341/training_args.bin +1 -1
- checkpoint-426/config.json +0 -4
- checkpoint-426/model.safetensors +1 -1
- checkpoint-426/optimizer.pt +1 -1
- checkpoint-426/scheduler.pt +1 -1
- checkpoint-426/trainer_state.json +44 -44
- checkpoint-426/training_args.bin +1 -1
- checkpoint-512/config.json +0 -4
- checkpoint-512/model.safetensors +1 -1
- checkpoint-512/optimizer.pt +1 -1
- checkpoint-512/scheduler.pt +1 -1
- checkpoint-512/trainer_state.json +51 -51
- checkpoint-512/training_args.bin +1 -1
- checkpoint-597/config.json +0 -4
- checkpoint-597/model.safetensors +1 -1
- checkpoint-597/optimizer.pt +1 -1
- checkpoint-597/scheduler.pt +1 -1
- checkpoint-597/trainer_state.json +60 -60
- checkpoint-597/training_args.bin +1 -1
- checkpoint-683/config.json +1 -4
- checkpoint-683/model.safetensors +1 -1
- checkpoint-683/optimizer.pt +1 -1
- checkpoint-683/scheduler.pt +1 -1
- checkpoint-683/trainer_state.json +69 -45
- checkpoint-683/training_args.bin +1 -1
- checkpoint-768/config.json +1 -4
- checkpoint-768/model.safetensors +1 -1
- checkpoint-768/optimizer.pt +1 -1
- checkpoint-768/scheduler.pt +1 -1
- checkpoint-768/trainer_state.json +78 -51
- checkpoint-768/training_args.bin +1 -1
- checkpoint-85/config.json +0 -4
- checkpoint-85/model.safetensors +1 -1
README.md
CHANGED
@@ -21,11 +21,11 @@ should probably proofread and complete it, then remove this comment. -->
|
|
21 |
|
22 |
This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset.
|
23 |
It achieves the following results on the evaluation set:
|
24 |
-
- Loss: 0.
|
25 |
-
- Accuracy: 0.
|
26 |
-
- Precision: 0.
|
27 |
-
- Recall: 0.
|
28 |
-
- F1: 0.
|
29 |
|
30 |
## Model description
|
31 |
|
@@ -53,16 +53,22 @@ The following hyperparameters were used during training:
|
|
53 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
54 |
- lr_scheduler_type: cosine
|
55 |
- lr_scheduler_warmup_ratio: 0.001
|
56 |
-
- num_epochs:
|
57 |
|
58 |
### Training results
|
59 |
|
60 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
|
61 |
|:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
|
62 |
-
| No log | 0.9956 | 85 | 0.
|
63 |
-
| No log | 1.9912 | 170 | 0.
|
64 |
-
| No log | 2.9985 | 256 | 0.
|
65 |
-
| No log | 3.
|
|
|
|
|
|
|
|
|
|
|
|
|
66 |
|
67 |
|
68 |
### Framework versions
|
|
|
21 |
|
22 |
This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset.
|
23 |
It achieves the following results on the evaluation set:
|
24 |
+
- Loss: 0.0338
|
25 |
+
- Accuracy: 0.9912
|
26 |
+
- Precision: 0.9912
|
27 |
+
- Recall: 0.9912
|
28 |
+
- F1: 0.9912
|
29 |
|
30 |
## Model description
|
31 |
|
|
|
53 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
54 |
- lr_scheduler_type: cosine
|
55 |
- lr_scheduler_warmup_ratio: 0.001
|
56 |
+
- num_epochs: 10
|
57 |
|
58 |
### Training results
|
59 |
|
60 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
|
61 |
|:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
|
62 |
+
| No log | 0.9956 | 85 | 0.1197 | 0.9538 | 0.9535 | 0.9538 | 0.9536 |
|
63 |
+
| No log | 1.9912 | 170 | 0.0601 | 0.9832 | 0.9831 | 0.9832 | 0.9831 |
|
64 |
+
| No log | 2.9985 | 256 | 0.0506 | 0.9868 | 0.9868 | 0.9868 | 0.9868 |
|
65 |
+
| No log | 3.9941 | 341 | 0.0461 | 0.9861 | 0.9864 | 0.9861 | 0.9862 |
|
66 |
+
| No log | 4.9898 | 426 | 0.0439 | 0.9890 | 0.9891 | 0.9890 | 0.9890 |
|
67 |
+
| 0.0779 | 5.9971 | 512 | 0.0396 | 0.9905 | 0.9905 | 0.9905 | 0.9905 |
|
68 |
+
| 0.0779 | 6.9927 | 597 | 0.0350 | 0.9919 | 0.9919 | 0.9919 | 0.9919 |
|
69 |
+
| 0.0779 | 8.0 | 683 | 0.0335 | 0.9912 | 0.9912 | 0.9912 | 0.9912 |
|
70 |
+
| 0.0779 | 8.9956 | 768 | 0.0337 | 0.9912 | 0.9912 | 0.9912 | 0.9912 |
|
71 |
+
| 0.0779 | 9.9561 | 850 | 0.0338 | 0.9912 | 0.9912 | 0.9912 | 0.9912 |
|
72 |
|
73 |
|
74 |
### Framework versions
|
checkpoint-170/config.json
CHANGED
@@ -55,10 +55,6 @@
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
58 |
-
"label2id": {
|
59 |
-
"crying": 0,
|
60 |
-
"no_crying": 1
|
61 |
-
},
|
62 |
"layer_norm_eps": 1e-05,
|
63 |
"layerdrop": 0.0,
|
64 |
"mask_feature_length": 10,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-170/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c27ce70effb26d2c4fae3a9e5f9435a7adf1d9096be67f3e04eaf7266135f148
|
3 |
size 94763496
|
checkpoint-170/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f521c92737364b558a7a1f423ef220dcbbcf0650e982c3e4d1b202ec007872c8
|
3 |
size 189552570
|
checkpoint-170/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba2c60537414c36d76239817fe1c8be075bed144e4b9d191a70b981deda17823
|
3 |
size 1064
|
checkpoint-170/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-170",
|
4 |
"epoch": 1.9912152269399708,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 170,
|
@@ -10,33 +10,33 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
-
"eval_accuracy": 0.
|
14 |
-
"eval_f1": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_precision": 0.
|
17 |
-
"eval_recall": 0.
|
18 |
-
"eval_runtime":
|
19 |
-
"eval_samples_per_second":
|
20 |
-
"eval_steps_per_second":
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
-
"eval_accuracy": 0.
|
26 |
-
"eval_f1": 0.
|
27 |
-
"eval_loss": 0.
|
28 |
-
"eval_precision": 0.
|
29 |
-
"eval_recall": 0.
|
30 |
-
"eval_runtime":
|
31 |
-
"eval_samples_per_second":
|
32 |
-
"eval_steps_per_second": 28.
|
33 |
"step": 170
|
34 |
}
|
35 |
],
|
36 |
"logging_steps": 500,
|
37 |
-
"max_steps":
|
38 |
"num_input_tokens_seen": 0,
|
39 |
-
"num_train_epochs":
|
40 |
"save_steps": 500,
|
41 |
"stateful_callbacks": {
|
42 |
"EarlyStoppingCallback": {
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.9831501831501831,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-170",
|
4 |
"epoch": 1.9912152269399708,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 170,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
+
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
}
|
35 |
],
|
36 |
"logging_steps": 500,
|
37 |
+
"max_steps": 850,
|
38 |
"num_input_tokens_seen": 0,
|
39 |
+
"num_train_epochs": 10,
|
40 |
"save_steps": 500,
|
41 |
"stateful_callbacks": {
|
42 |
"EarlyStoppingCallback": {
|
checkpoint-170/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-256/config.json
CHANGED
@@ -55,10 +55,6 @@
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
58 |
-
"label2id": {
|
59 |
-
"crying": 0,
|
60 |
-
"no_crying": 1
|
61 |
-
},
|
62 |
"layer_norm_eps": 1e-05,
|
63 |
"layerdrop": 0.0,
|
64 |
"mask_feature_length": 10,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-256/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2992b8dfd27781b5920e6b800dd0bec2a8809a5eb8c0508b6726dd68807c3b6d
|
3 |
size 94763496
|
checkpoint-256/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb0f801198c29f1cc11cf39d019a185562336bfbfdee4056f15cc25e0604767a
|
3 |
size 189552570
|
checkpoint-256/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ea8c99bcd3f4c186db34ca4e9cbe89b586ea3bd6cf9703b17e9ec1f6c1ff961
|
3 |
size 1064
|
checkpoint-256/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-256",
|
4 |
"epoch": 2.998535871156662,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 256,
|
@@ -10,45 +10,45 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
-
"eval_accuracy": 0.
|
14 |
-
"eval_f1": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_precision": 0.
|
17 |
-
"eval_recall": 0.
|
18 |
-
"eval_runtime":
|
19 |
-
"eval_samples_per_second":
|
20 |
-
"eval_steps_per_second":
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
-
"eval_accuracy": 0.
|
26 |
-
"eval_f1": 0.
|
27 |
-
"eval_loss": 0.
|
28 |
-
"eval_precision": 0.
|
29 |
-
"eval_recall": 0.
|
30 |
-
"eval_runtime":
|
31 |
-
"eval_samples_per_second":
|
32 |
-
"eval_steps_per_second": 28.
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
-
"eval_accuracy": 0.
|
38 |
-
"eval_f1": 0.
|
39 |
-
"eval_loss": 0.
|
40 |
-
"eval_precision": 0.
|
41 |
-
"eval_recall": 0.
|
42 |
-
"eval_runtime":
|
43 |
-
"eval_samples_per_second":
|
44 |
-
"eval_steps_per_second": 28.
|
45 |
"step": 256
|
46 |
}
|
47 |
],
|
48 |
"logging_steps": 500,
|
49 |
-
"max_steps":
|
50 |
"num_input_tokens_seen": 0,
|
51 |
-
"num_train_epochs":
|
52 |
"save_steps": 500,
|
53 |
"stateful_callbacks": {
|
54 |
"EarlyStoppingCallback": {
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.9868131868131869,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-256",
|
4 |
"epoch": 2.998535871156662,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 256,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
+
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9868131868131869,
|
38 |
+
"eval_f1": 0.9868241092241091,
|
39 |
+
"eval_loss": 0.05060575157403946,
|
40 |
+
"eval_precision": 0.9868403029537207,
|
41 |
+
"eval_recall": 0.9868131868131869,
|
42 |
+
"eval_runtime": 5.9299,
|
43 |
+
"eval_samples_per_second": 230.189,
|
44 |
+
"eval_steps_per_second": 28.837,
|
45 |
"step": 256
|
46 |
}
|
47 |
],
|
48 |
"logging_steps": 500,
|
49 |
+
"max_steps": 850,
|
50 |
"num_input_tokens_seen": 0,
|
51 |
+
"num_train_epochs": 10,
|
52 |
"save_steps": 500,
|
53 |
"stateful_callbacks": {
|
54 |
"EarlyStoppingCallback": {
|
checkpoint-256/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-341/config.json
CHANGED
@@ -55,10 +55,6 @@
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
58 |
-
"label2id": {
|
59 |
-
"crying": 0,
|
60 |
-
"no_crying": 1
|
61 |
-
},
|
62 |
"layer_norm_eps": 1e-05,
|
63 |
"layerdrop": 0.0,
|
64 |
"mask_feature_length": 10,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-341/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3fb881f587c38faf027d9d2f92c1142607ce7f334b76baccc3fafe76fbc4f38
|
3 |
size 94763496
|
checkpoint-341/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62cf0c2fa4abd219e7fa80805ad290927ba54a46ecf6203e78bc102ea268400c
|
3 |
size 189552570
|
checkpoint-341/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-
|
4 |
"epoch": 3.994143484626647,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 341,
|
@@ -10,50 +10,50 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
-
"eval_accuracy": 0.
|
14 |
-
"eval_f1": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_precision": 0.
|
17 |
-
"eval_recall": 0.
|
18 |
-
"eval_runtime":
|
19 |
-
"eval_samples_per_second":
|
20 |
-
"eval_steps_per_second":
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
-
"eval_accuracy": 0.
|
26 |
-
"eval_f1": 0.
|
27 |
-
"eval_loss": 0.
|
28 |
-
"eval_precision": 0.
|
29 |
-
"eval_recall": 0.
|
30 |
-
"eval_runtime": 5.
|
31 |
-
"eval_samples_per_second":
|
32 |
-
"eval_steps_per_second":
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
"eval_accuracy": 0.9868131868131869,
|
38 |
-
"eval_f1": 0.
|
39 |
-
"eval_loss": 0.
|
40 |
-
"eval_precision": 0.
|
41 |
"eval_recall": 0.9868131868131869,
|
42 |
-
"eval_runtime":
|
43 |
-
"eval_samples_per_second":
|
44 |
-
"eval_steps_per_second":
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
-
"eval_accuracy": 0.
|
50 |
-
"eval_f1": 0.
|
51 |
-
"eval_loss": 0.
|
52 |
-
"eval_precision": 0.
|
53 |
-
"eval_recall": 0.
|
54 |
-
"eval_runtime":
|
55 |
-
"eval_samples_per_second":
|
56 |
-
"eval_steps_per_second":
|
57 |
"step": 341
|
58 |
}
|
59 |
],
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.9868131868131869,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-256",
|
4 |
"epoch": 3.994143484626647,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 341,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
+
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
"eval_accuracy": 0.9868131868131869,
|
38 |
+
"eval_f1": 0.9868241092241091,
|
39 |
+
"eval_loss": 0.05060575157403946,
|
40 |
+
"eval_precision": 0.9868403029537207,
|
41 |
"eval_recall": 0.9868131868131869,
|
42 |
+
"eval_runtime": 5.9299,
|
43 |
+
"eval_samples_per_second": 230.189,
|
44 |
+
"eval_steps_per_second": 28.837,
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.9860805860805861,
|
50 |
+
"eval_f1": 0.9861535269385863,
|
51 |
+
"eval_loss": 0.04610973969101906,
|
52 |
+
"eval_precision": 0.986445121171901,
|
53 |
+
"eval_recall": 0.9860805860805861,
|
54 |
+
"eval_runtime": 5.9428,
|
55 |
+
"eval_samples_per_second": 229.69,
|
56 |
+
"eval_steps_per_second": 28.774,
|
57 |
"step": 341
|
58 |
}
|
59 |
],
|
checkpoint-341/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-426/config.json
CHANGED
@@ -55,10 +55,6 @@
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
58 |
-
"label2id": {
|
59 |
-
"crying": 0,
|
60 |
-
"no_crying": 1
|
61 |
-
},
|
62 |
"layer_norm_eps": 1e-05,
|
63 |
"layerdrop": 0.0,
|
64 |
"mask_feature_length": 10,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-426/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f21392d62c0aae2cb86ef601a6fdd136f97139074d9fc1a5418821cfd21d8f2f
|
3 |
size 94763496
|
checkpoint-426/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54aacdf3b8335705d217fdd88584f914b41fdc67436f327708a19652d4774b8e
|
3 |
size 189552570
|
checkpoint-426/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:579ef0f1564878cc661672a4c8ce1e561a689fa403a5862a5af2e3ad39ed51e9
|
3 |
size 1064
|
checkpoint-426/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-
|
4 |
"epoch": 4.989751098096632,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 426,
|
@@ -10,69 +10,69 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
-
"eval_accuracy": 0.
|
14 |
-
"eval_f1": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_precision": 0.
|
17 |
-
"eval_recall": 0.
|
18 |
-
"eval_runtime":
|
19 |
-
"eval_samples_per_second":
|
20 |
-
"eval_steps_per_second":
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
-
"eval_accuracy": 0.
|
26 |
-
"eval_f1": 0.
|
27 |
-
"eval_loss": 0.
|
28 |
-
"eval_precision": 0.
|
29 |
-
"eval_recall": 0.
|
30 |
-
"eval_runtime":
|
31 |
-
"eval_samples_per_second":
|
32 |
-
"eval_steps_per_second":
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
-
"eval_accuracy": 0.
|
38 |
-
"eval_f1": 0.
|
39 |
-
"eval_loss": 0.
|
40 |
-
"eval_precision": 0.
|
41 |
-
"eval_recall": 0.
|
42 |
-
"eval_runtime": 5.
|
43 |
-
"eval_samples_per_second":
|
44 |
-
"eval_steps_per_second": 28.
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
-
"eval_accuracy": 0.
|
50 |
-
"eval_f1": 0.
|
51 |
-
"eval_loss": 0.
|
52 |
-
"eval_precision": 0.
|
53 |
-
"eval_recall": 0.
|
54 |
-
"eval_runtime":
|
55 |
-
"eval_samples_per_second":
|
56 |
-
"eval_steps_per_second":
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
-
"eval_accuracy": 0.
|
62 |
-
"eval_f1": 0.
|
63 |
-
"eval_loss": 0.
|
64 |
-
"eval_precision": 0.
|
65 |
-
"eval_recall": 0.
|
66 |
-
"eval_runtime":
|
67 |
-
"eval_samples_per_second":
|
68 |
-
"eval_steps_per_second":
|
69 |
"step": 426
|
70 |
}
|
71 |
],
|
72 |
"logging_steps": 500,
|
73 |
-
"max_steps":
|
74 |
"num_input_tokens_seen": 0,
|
75 |
-
"num_train_epochs":
|
76 |
"save_steps": 500,
|
77 |
"stateful_callbacks": {
|
78 |
"EarlyStoppingCallback": {
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.989010989010989,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-426",
|
4 |
"epoch": 4.989751098096632,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 426,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
+
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9868131868131869,
|
38 |
+
"eval_f1": 0.9868241092241091,
|
39 |
+
"eval_loss": 0.05060575157403946,
|
40 |
+
"eval_precision": 0.9868403029537207,
|
41 |
+
"eval_recall": 0.9868131868131869,
|
42 |
+
"eval_runtime": 5.9299,
|
43 |
+
"eval_samples_per_second": 230.189,
|
44 |
+
"eval_steps_per_second": 28.837,
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.9860805860805861,
|
50 |
+
"eval_f1": 0.9861535269385863,
|
51 |
+
"eval_loss": 0.04610973969101906,
|
52 |
+
"eval_precision": 0.986445121171901,
|
53 |
+
"eval_recall": 0.9860805860805861,
|
54 |
+
"eval_runtime": 5.9428,
|
55 |
+
"eval_samples_per_second": 229.69,
|
56 |
+
"eval_steps_per_second": 28.774,
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
+
"eval_accuracy": 0.989010989010989,
|
62 |
+
"eval_f1": 0.9890246085529585,
|
63 |
+
"eval_loss": 0.0438910573720932,
|
64 |
+
"eval_precision": 0.989050109460552,
|
65 |
+
"eval_recall": 0.989010989010989,
|
66 |
+
"eval_runtime": 5.937,
|
67 |
+
"eval_samples_per_second": 229.913,
|
68 |
+
"eval_steps_per_second": 28.802,
|
69 |
"step": 426
|
70 |
}
|
71 |
],
|
72 |
"logging_steps": 500,
|
73 |
+
"max_steps": 850,
|
74 |
"num_input_tokens_seen": 0,
|
75 |
+
"num_train_epochs": 10,
|
76 |
"save_steps": 500,
|
77 |
"stateful_callbacks": {
|
78 |
"EarlyStoppingCallback": {
|
checkpoint-426/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-512/config.json
CHANGED
@@ -55,10 +55,6 @@
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
58 |
-
"label2id": {
|
59 |
-
"crying": 0,
|
60 |
-
"no_crying": 1
|
61 |
-
},
|
62 |
"layer_norm_eps": 1e-05,
|
63 |
"layerdrop": 0.0,
|
64 |
"mask_feature_length": 10,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-512/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35f0fba66e2bc44178994b63877f32d5ef3660e920cd130dae9ccbf8e054d15a
|
3 |
size 94763496
|
checkpoint-512/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32489c4cc27d23701cd78e51f1daf46563d47112b4e3520ad9568800f0b86fb3
|
3 |
size 189552570
|
checkpoint-512/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0643374a18b5da11030bd13ba87a30fd86ee77d7702b1fa1d0aee2f444563b7c
|
3 |
size 1064
|
checkpoint-512/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-
|
4 |
"epoch": 5.997071742313324,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 512,
|
@@ -11,80 +11,80 @@
|
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
"eval_accuracy": 0.9538461538461539,
|
14 |
-
"eval_f1": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_precision": 0.
|
17 |
"eval_recall": 0.9538461538461539,
|
18 |
-
"eval_runtime": 5.
|
19 |
-
"eval_samples_per_second":
|
20 |
-
"eval_steps_per_second":
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
-
"eval_accuracy": 0.
|
26 |
-
"eval_f1": 0.
|
27 |
-
"eval_loss": 0.
|
28 |
-
"eval_precision": 0.
|
29 |
-
"eval_recall": 0.
|
30 |
-
"eval_runtime": 5.
|
31 |
-
"eval_samples_per_second": 230.
|
32 |
-
"eval_steps_per_second": 28.
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
-
"eval_accuracy": 0.
|
38 |
-
"eval_f1": 0.
|
39 |
-
"eval_loss": 0.
|
40 |
-
"eval_precision": 0.
|
41 |
-
"eval_recall": 0.
|
42 |
-
"eval_runtime": 5.
|
43 |
-
"eval_samples_per_second": 230.
|
44 |
-
"eval_steps_per_second": 28.
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
-
"eval_accuracy": 0.
|
50 |
-
"eval_f1": 0.
|
51 |
-
"eval_loss": 0.
|
52 |
-
"eval_precision": 0.
|
53 |
-
"eval_recall": 0.
|
54 |
-
"eval_runtime": 5.
|
55 |
-
"eval_samples_per_second":
|
56 |
-
"eval_steps_per_second": 28.
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
-
"eval_accuracy": 0.
|
62 |
-
"eval_f1": 0.
|
63 |
-
"eval_loss": 0.
|
64 |
-
"eval_precision": 0.
|
65 |
-
"eval_recall": 0.
|
66 |
-
"eval_runtime": 5.
|
67 |
-
"eval_samples_per_second":
|
68 |
-
"eval_steps_per_second": 28.
|
69 |
"step": 426
|
70 |
},
|
71 |
{
|
72 |
"epoch": 5.856515373352855,
|
73 |
-
"grad_norm": 0.
|
74 |
-
"learning_rate": 1.
|
75 |
-
"loss": 0.
|
76 |
"step": 500
|
77 |
},
|
78 |
{
|
79 |
"epoch": 5.997071742313324,
|
80 |
-
"eval_accuracy": 0.
|
81 |
-
"eval_f1": 0.
|
82 |
-
"eval_loss": 0.
|
83 |
-
"eval_precision": 0.
|
84 |
-
"eval_recall": 0.
|
85 |
-
"eval_runtime": 5.
|
86 |
-
"eval_samples_per_second":
|
87 |
-
"eval_steps_per_second":
|
88 |
"step": 512
|
89 |
}
|
90 |
],
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.9904761904761905,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-512",
|
4 |
"epoch": 5.997071742313324,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 512,
|
|
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9868131868131869,
|
38 |
+
"eval_f1": 0.9868241092241091,
|
39 |
+
"eval_loss": 0.05060575157403946,
|
40 |
+
"eval_precision": 0.9868403029537207,
|
41 |
+
"eval_recall": 0.9868131868131869,
|
42 |
+
"eval_runtime": 5.9299,
|
43 |
+
"eval_samples_per_second": 230.189,
|
44 |
+
"eval_steps_per_second": 28.837,
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.9860805860805861,
|
50 |
+
"eval_f1": 0.9861535269385863,
|
51 |
+
"eval_loss": 0.04610973969101906,
|
52 |
+
"eval_precision": 0.986445121171901,
|
53 |
+
"eval_recall": 0.9860805860805861,
|
54 |
+
"eval_runtime": 5.9428,
|
55 |
+
"eval_samples_per_second": 229.69,
|
56 |
+
"eval_steps_per_second": 28.774,
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
+
"eval_accuracy": 0.989010989010989,
|
62 |
+
"eval_f1": 0.9890246085529585,
|
63 |
+
"eval_loss": 0.0438910573720932,
|
64 |
+
"eval_precision": 0.989050109460552,
|
65 |
+
"eval_recall": 0.989010989010989,
|
66 |
+
"eval_runtime": 5.937,
|
67 |
+
"eval_samples_per_second": 229.913,
|
68 |
+
"eval_steps_per_second": 28.802,
|
69 |
"step": 426
|
70 |
},
|
71 |
{
|
72 |
"epoch": 5.856515373352855,
|
73 |
+
"grad_norm": 0.08060992509126663,
|
74 |
+
"learning_rate": 1.0917042498003083e-05,
|
75 |
+
"loss": 0.0779,
|
76 |
"step": 500
|
77 |
},
|
78 |
{
|
79 |
"epoch": 5.997071742313324,
|
80 |
+
"eval_accuracy": 0.9904761904761905,
|
81 |
+
"eval_f1": 0.9904879940792306,
|
82 |
+
"eval_loss": 0.0396205335855484,
|
83 |
+
"eval_precision": 0.9905117057078526,
|
84 |
+
"eval_recall": 0.9904761904761905,
|
85 |
+
"eval_runtime": 5.9047,
|
86 |
+
"eval_samples_per_second": 231.172,
|
87 |
+
"eval_steps_per_second": 28.96,
|
88 |
"step": 512
|
89 |
}
|
90 |
],
|
checkpoint-512/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-597/config.json
CHANGED
@@ -55,10 +55,6 @@
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
58 |
-
"label2id": {
|
59 |
-
"crying": 0,
|
60 |
-
"no_crying": 1
|
61 |
-
},
|
62 |
"layer_norm_eps": 1e-05,
|
63 |
"layerdrop": 0.0,
|
64 |
"mask_feature_length": 10,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-597/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fefc9fc9e0c6f521d52f6944550be09ad08cf2a406465b2bad96d43e8e656a9
|
3 |
size 94763496
|
checkpoint-597/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de0a5be77c65d20eadb1a24d44af2c728f76e6c9b01b584c11efa9dac4bab929
|
3 |
size 189552570
|
checkpoint-597/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65e5b7798f882f09e50f351045d72a3f8133a68153dae42b3d7541432cd2e9e0
|
3 |
size 1064
|
checkpoint-597/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-
|
4 |
"epoch": 6.992679355783309,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 597,
|
@@ -11,92 +11,92 @@
|
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
"eval_accuracy": 0.9538461538461539,
|
14 |
-
"eval_f1": 0.
|
15 |
-
"eval_loss": 0.
|
16 |
-
"eval_precision": 0.
|
17 |
"eval_recall": 0.9538461538461539,
|
18 |
-
"eval_runtime": 5.
|
19 |
-
"eval_samples_per_second":
|
20 |
-
"eval_steps_per_second":
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
-
"eval_accuracy": 0.
|
26 |
-
"eval_f1": 0.
|
27 |
-
"eval_loss": 0.
|
28 |
-
"eval_precision": 0.
|
29 |
-
"eval_recall": 0.
|
30 |
-
"eval_runtime": 5.
|
31 |
-
"eval_samples_per_second": 230.
|
32 |
-
"eval_steps_per_second": 28.
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
-
"eval_accuracy": 0.
|
38 |
-
"eval_f1": 0.
|
39 |
-
"eval_loss": 0.
|
40 |
-
"eval_precision": 0.
|
41 |
-
"eval_recall": 0.
|
42 |
-
"eval_runtime": 5.
|
43 |
-
"eval_samples_per_second": 230.
|
44 |
-
"eval_steps_per_second": 28.
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
-
"eval_accuracy": 0.
|
50 |
-
"eval_f1": 0.
|
51 |
-
"eval_loss": 0.
|
52 |
-
"eval_precision": 0.
|
53 |
-
"eval_recall": 0.
|
54 |
-
"eval_runtime": 5.
|
55 |
-
"eval_samples_per_second":
|
56 |
-
"eval_steps_per_second": 28.
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
-
"eval_accuracy": 0.
|
62 |
-
"eval_f1": 0.
|
63 |
-
"eval_loss": 0.
|
64 |
-
"eval_precision": 0.
|
65 |
-
"eval_recall": 0.
|
66 |
-
"eval_runtime": 5.
|
67 |
-
"eval_samples_per_second":
|
68 |
-
"eval_steps_per_second": 28.
|
69 |
"step": 426
|
70 |
},
|
71 |
{
|
72 |
"epoch": 5.856515373352855,
|
73 |
-
"grad_norm": 0.
|
74 |
-
"learning_rate": 1.
|
75 |
-
"loss": 0.
|
76 |
"step": 500
|
77 |
},
|
78 |
{
|
79 |
"epoch": 5.997071742313324,
|
80 |
-
"eval_accuracy": 0.
|
81 |
-
"eval_f1": 0.
|
82 |
-
"eval_loss": 0.
|
83 |
-
"eval_precision": 0.
|
84 |
-
"eval_recall": 0.
|
85 |
-
"eval_runtime": 5.
|
86 |
-
"eval_samples_per_second":
|
87 |
-
"eval_steps_per_second":
|
88 |
"step": 512
|
89 |
},
|
90 |
{
|
91 |
"epoch": 6.992679355783309,
|
92 |
-
"eval_accuracy": 0.
|
93 |
-
"eval_f1": 0.
|
94 |
-
"eval_loss": 0.
|
95 |
-
"eval_precision": 0.
|
96 |
-
"eval_recall": 0.
|
97 |
-
"eval_runtime":
|
98 |
-
"eval_samples_per_second":
|
99 |
-
"eval_steps_per_second":
|
100 |
"step": 597
|
101 |
}
|
102 |
],
|
@@ -121,7 +121,7 @@
|
|
121 |
"should_evaluate": false,
|
122 |
"should_log": false,
|
123 |
"should_save": true,
|
124 |
-
"should_training_stop":
|
125 |
},
|
126 |
"attributes": {}
|
127 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.991941391941392,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597",
|
4 |
"epoch": 6.992679355783309,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 597,
|
|
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9868131868131869,
|
38 |
+
"eval_f1": 0.9868241092241091,
|
39 |
+
"eval_loss": 0.05060575157403946,
|
40 |
+
"eval_precision": 0.9868403029537207,
|
41 |
+
"eval_recall": 0.9868131868131869,
|
42 |
+
"eval_runtime": 5.9299,
|
43 |
+
"eval_samples_per_second": 230.189,
|
44 |
+
"eval_steps_per_second": 28.837,
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.9860805860805861,
|
50 |
+
"eval_f1": 0.9861535269385863,
|
51 |
+
"eval_loss": 0.04610973969101906,
|
52 |
+
"eval_precision": 0.986445121171901,
|
53 |
+
"eval_recall": 0.9860805860805861,
|
54 |
+
"eval_runtime": 5.9428,
|
55 |
+
"eval_samples_per_second": 229.69,
|
56 |
+
"eval_steps_per_second": 28.774,
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
+
"eval_accuracy": 0.989010989010989,
|
62 |
+
"eval_f1": 0.9890246085529585,
|
63 |
+
"eval_loss": 0.0438910573720932,
|
64 |
+
"eval_precision": 0.989050109460552,
|
65 |
+
"eval_recall": 0.989010989010989,
|
66 |
+
"eval_runtime": 5.937,
|
67 |
+
"eval_samples_per_second": 229.913,
|
68 |
+
"eval_steps_per_second": 28.802,
|
69 |
"step": 426
|
70 |
},
|
71 |
{
|
72 |
"epoch": 5.856515373352855,
|
73 |
+
"grad_norm": 0.08060992509126663,
|
74 |
+
"learning_rate": 1.0917042498003083e-05,
|
75 |
+
"loss": 0.0779,
|
76 |
"step": 500
|
77 |
},
|
78 |
{
|
79 |
"epoch": 5.997071742313324,
|
80 |
+
"eval_accuracy": 0.9904761904761905,
|
81 |
+
"eval_f1": 0.9904879940792306,
|
82 |
+
"eval_loss": 0.0396205335855484,
|
83 |
+
"eval_precision": 0.9905117057078526,
|
84 |
+
"eval_recall": 0.9904761904761905,
|
85 |
+
"eval_runtime": 5.9047,
|
86 |
+
"eval_samples_per_second": 231.172,
|
87 |
+
"eval_steps_per_second": 28.96,
|
88 |
"step": 512
|
89 |
},
|
90 |
{
|
91 |
"epoch": 6.992679355783309,
|
92 |
+
"eval_accuracy": 0.991941391941392,
|
93 |
+
"eval_f1": 0.9919447375447602,
|
94 |
+
"eval_loss": 0.035047151148319244,
|
95 |
+
"eval_precision": 0.9919494135494136,
|
96 |
+
"eval_recall": 0.991941391941392,
|
97 |
+
"eval_runtime": 6.0502,
|
98 |
+
"eval_samples_per_second": 225.612,
|
99 |
+
"eval_steps_per_second": 28.264,
|
100 |
"step": 597
|
101 |
}
|
102 |
],
|
|
|
121 |
"should_evaluate": false,
|
122 |
"should_log": false,
|
123 |
"should_save": true,
|
124 |
+
"should_training_stop": false
|
125 |
},
|
126 |
"attributes": {}
|
127 |
}
|
checkpoint-597/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-683/config.json
CHANGED
@@ -45,6 +45,7 @@
|
|
45 |
"feat_proj_dropout": 0.0,
|
46 |
"feat_proj_layer_norm": false,
|
47 |
"final_dropout": 0.0,
|
|
|
48 |
"hidden_act": "gelu",
|
49 |
"hidden_dropout": 0.1,
|
50 |
"hidden_size": 768,
|
@@ -54,10 +55,6 @@
|
|
54 |
},
|
55 |
"initializer_range": 0.02,
|
56 |
"intermediate_size": 3072,
|
57 |
-
"label2id": {
|
58 |
-
"crying": "0",
|
59 |
-
"no_crying": "1"
|
60 |
-
},
|
61 |
"layer_norm_eps": 1e-05,
|
62 |
"layerdrop": 0.0,
|
63 |
"mask_feature_length": 10,
|
|
|
45 |
"feat_proj_dropout": 0.0,
|
46 |
"feat_proj_layer_norm": false,
|
47 |
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
"hidden_act": "gelu",
|
50 |
"hidden_dropout": 0.1,
|
51 |
"hidden_size": 768,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-683/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47eb6b3cfe6fa933d4d9bda0995a1e235c1d9ec1d2481708bed5a4149e8262a4
|
3 |
size 94763496
|
checkpoint-683/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccd75da0e8ea0bf33fb98b23e1d8b9fc9f33d7c31a91837683d49c15ae856034
|
3 |
size 189552570
|
checkpoint-683/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bde01021f76a64b9ec7866fcc536e72a45008d7566739a02f03c4c895a14c72c
|
3 |
size 1064
|
checkpoint-683/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-
|
4 |
"epoch": 8.0,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 683,
|
@@ -10,81 +10,105 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
-
"eval_accuracy": 0.
|
14 |
-
"
|
15 |
-
"
|
16 |
-
"
|
17 |
-
"
|
|
|
|
|
|
|
18 |
"step": 85
|
19 |
},
|
20 |
{
|
21 |
"epoch": 1.9912152269399708,
|
22 |
-
"eval_accuracy": 0.
|
23 |
-
"
|
24 |
-
"
|
25 |
-
"
|
26 |
-
"
|
|
|
|
|
|
|
27 |
"step": 170
|
28 |
},
|
29 |
{
|
30 |
"epoch": 2.998535871156662,
|
31 |
-
"eval_accuracy": 0.
|
32 |
-
"
|
33 |
-
"
|
34 |
-
"
|
35 |
-
"
|
|
|
|
|
|
|
36 |
"step": 256
|
37 |
},
|
38 |
{
|
39 |
"epoch": 3.994143484626647,
|
40 |
-
"eval_accuracy": 0.
|
41 |
-
"
|
42 |
-
"
|
43 |
-
"
|
44 |
-
"
|
|
|
|
|
|
|
45 |
"step": 341
|
46 |
},
|
47 |
{
|
48 |
"epoch": 4.989751098096632,
|
49 |
-
"eval_accuracy": 0.
|
50 |
-
"
|
51 |
-
"
|
52 |
-
"
|
53 |
-
"
|
|
|
|
|
|
|
54 |
"step": 426
|
55 |
},
|
56 |
{
|
57 |
"epoch": 5.856515373352855,
|
58 |
-
"grad_norm": 0.
|
59 |
-
"learning_rate":
|
60 |
-
"loss": 0.
|
61 |
"step": 500
|
62 |
},
|
63 |
{
|
64 |
"epoch": 5.997071742313324,
|
65 |
-
"eval_accuracy": 0.
|
66 |
-
"
|
67 |
-
"
|
68 |
-
"
|
69 |
-
"
|
|
|
|
|
|
|
70 |
"step": 512
|
71 |
},
|
72 |
{
|
73 |
"epoch": 6.992679355783309,
|
74 |
-
"eval_accuracy": 0.
|
75 |
-
"
|
76 |
-
"
|
77 |
-
"
|
78 |
-
"
|
|
|
|
|
|
|
79 |
"step": 597
|
80 |
},
|
81 |
{
|
82 |
"epoch": 8.0,
|
83 |
-
"eval_accuracy": 0.
|
84 |
-
"
|
85 |
-
"
|
86 |
-
"
|
87 |
-
"
|
|
|
|
|
|
|
88 |
"step": 683
|
89 |
}
|
90 |
],
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.991941391941392,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597",
|
4 |
"epoch": 8.0,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 683,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
+
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9868131868131869,
|
38 |
+
"eval_f1": 0.9868241092241091,
|
39 |
+
"eval_loss": 0.05060575157403946,
|
40 |
+
"eval_precision": 0.9868403029537207,
|
41 |
+
"eval_recall": 0.9868131868131869,
|
42 |
+
"eval_runtime": 5.9299,
|
43 |
+
"eval_samples_per_second": 230.189,
|
44 |
+
"eval_steps_per_second": 28.837,
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.9860805860805861,
|
50 |
+
"eval_f1": 0.9861535269385863,
|
51 |
+
"eval_loss": 0.04610973969101906,
|
52 |
+
"eval_precision": 0.986445121171901,
|
53 |
+
"eval_recall": 0.9860805860805861,
|
54 |
+
"eval_runtime": 5.9428,
|
55 |
+
"eval_samples_per_second": 229.69,
|
56 |
+
"eval_steps_per_second": 28.774,
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
+
"eval_accuracy": 0.989010989010989,
|
62 |
+
"eval_f1": 0.9890246085529585,
|
63 |
+
"eval_loss": 0.0438910573720932,
|
64 |
+
"eval_precision": 0.989050109460552,
|
65 |
+
"eval_recall": 0.989010989010989,
|
66 |
+
"eval_runtime": 5.937,
|
67 |
+
"eval_samples_per_second": 229.913,
|
68 |
+
"eval_steps_per_second": 28.802,
|
69 |
"step": 426
|
70 |
},
|
71 |
{
|
72 |
"epoch": 5.856515373352855,
|
73 |
+
"grad_norm": 0.08060992509126663,
|
74 |
+
"learning_rate": 1.0917042498003083e-05,
|
75 |
+
"loss": 0.0779,
|
76 |
"step": 500
|
77 |
},
|
78 |
{
|
79 |
"epoch": 5.997071742313324,
|
80 |
+
"eval_accuracy": 0.9904761904761905,
|
81 |
+
"eval_f1": 0.9904879940792306,
|
82 |
+
"eval_loss": 0.0396205335855484,
|
83 |
+
"eval_precision": 0.9905117057078526,
|
84 |
+
"eval_recall": 0.9904761904761905,
|
85 |
+
"eval_runtime": 5.9047,
|
86 |
+
"eval_samples_per_second": 231.172,
|
87 |
+
"eval_steps_per_second": 28.96,
|
88 |
"step": 512
|
89 |
},
|
90 |
{
|
91 |
"epoch": 6.992679355783309,
|
92 |
+
"eval_accuracy": 0.991941391941392,
|
93 |
+
"eval_f1": 0.9919447375447602,
|
94 |
+
"eval_loss": 0.035047151148319244,
|
95 |
+
"eval_precision": 0.9919494135494136,
|
96 |
+
"eval_recall": 0.991941391941392,
|
97 |
+
"eval_runtime": 6.0502,
|
98 |
+
"eval_samples_per_second": 225.612,
|
99 |
+
"eval_steps_per_second": 28.264,
|
100 |
"step": 597
|
101 |
},
|
102 |
{
|
103 |
"epoch": 8.0,
|
104 |
+
"eval_accuracy": 0.9912087912087912,
|
105 |
+
"eval_f1": 0.9912160728160728,
|
106 |
+
"eval_loss": 0.03350323066115379,
|
107 |
+
"eval_precision": 0.9912286614059304,
|
108 |
+
"eval_recall": 0.9912087912087912,
|
109 |
+
"eval_runtime": 5.79,
|
110 |
+
"eval_samples_per_second": 235.751,
|
111 |
+
"eval_steps_per_second": 29.534,
|
112 |
"step": 683
|
113 |
}
|
114 |
],
|
checkpoint-683/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-768/config.json
CHANGED
@@ -45,6 +45,7 @@
|
|
45 |
"feat_proj_dropout": 0.0,
|
46 |
"feat_proj_layer_norm": false,
|
47 |
"final_dropout": 0.0,
|
|
|
48 |
"hidden_act": "gelu",
|
49 |
"hidden_dropout": 0.1,
|
50 |
"hidden_size": 768,
|
@@ -54,10 +55,6 @@
|
|
54 |
},
|
55 |
"initializer_range": 0.02,
|
56 |
"intermediate_size": 3072,
|
57 |
-
"label2id": {
|
58 |
-
"crying": "0",
|
59 |
-
"no_crying": "1"
|
60 |
-
},
|
61 |
"layer_norm_eps": 1e-05,
|
62 |
"layerdrop": 0.0,
|
63 |
"mask_feature_length": 10,
|
|
|
45 |
"feat_proj_dropout": 0.0,
|
46 |
"feat_proj_layer_norm": false,
|
47 |
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
"hidden_act": "gelu",
|
50 |
"hidden_dropout": 0.1,
|
51 |
"hidden_size": 768,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-768/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:589720455553dad3b547e7fc5aac19151dbefadb26d39a6a04c708e344cfd310
|
3 |
size 94763496
|
checkpoint-768/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 189552570
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b863d95ad20867c4606dfd4b07ae1866e1bfbd283086e4449d924ccf79d9d2dc
|
3 |
size 189552570
|
checkpoint-768/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acb83cb237d82342af5936197af5c426903999a84d7161b385fa3b80c0070365
|
3 |
size 1064
|
checkpoint-768/trainer_state.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-
|
4 |
"epoch": 8.995607613469986,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 768,
|
@@ -10,90 +10,117 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
-
"eval_accuracy": 0.
|
14 |
-
"
|
15 |
-
"
|
16 |
-
"
|
17 |
-
"
|
|
|
|
|
|
|
18 |
"step": 85
|
19 |
},
|
20 |
{
|
21 |
"epoch": 1.9912152269399708,
|
22 |
-
"eval_accuracy": 0.
|
23 |
-
"
|
24 |
-
"
|
25 |
-
"
|
26 |
-
"
|
|
|
|
|
|
|
27 |
"step": 170
|
28 |
},
|
29 |
{
|
30 |
"epoch": 2.998535871156662,
|
31 |
-
"eval_accuracy": 0.
|
32 |
-
"
|
33 |
-
"
|
34 |
-
"
|
35 |
-
"
|
|
|
|
|
|
|
36 |
"step": 256
|
37 |
},
|
38 |
{
|
39 |
"epoch": 3.994143484626647,
|
40 |
-
"eval_accuracy": 0.
|
41 |
-
"
|
42 |
-
"
|
43 |
-
"
|
44 |
-
"
|
|
|
|
|
|
|
45 |
"step": 341
|
46 |
},
|
47 |
{
|
48 |
"epoch": 4.989751098096632,
|
49 |
-
"eval_accuracy": 0.
|
50 |
-
"
|
51 |
-
"
|
52 |
-
"
|
53 |
-
"
|
|
|
|
|
|
|
54 |
"step": 426
|
55 |
},
|
56 |
{
|
57 |
"epoch": 5.856515373352855,
|
58 |
-
"grad_norm": 0.
|
59 |
-
"learning_rate":
|
60 |
-
"loss": 0.
|
61 |
"step": 500
|
62 |
},
|
63 |
{
|
64 |
"epoch": 5.997071742313324,
|
65 |
-
"eval_accuracy": 0.
|
66 |
-
"
|
67 |
-
"
|
68 |
-
"
|
69 |
-
"
|
|
|
|
|
|
|
70 |
"step": 512
|
71 |
},
|
72 |
{
|
73 |
"epoch": 6.992679355783309,
|
74 |
-
"eval_accuracy": 0.
|
75 |
-
"
|
76 |
-
"
|
77 |
-
"
|
78 |
-
"
|
|
|
|
|
|
|
79 |
"step": 597
|
80 |
},
|
81 |
{
|
82 |
"epoch": 8.0,
|
83 |
-
"eval_accuracy": 0.
|
84 |
-
"
|
85 |
-
"
|
86 |
-
"
|
87 |
-
"
|
|
|
|
|
|
|
88 |
"step": 683
|
89 |
},
|
90 |
{
|
91 |
"epoch": 8.995607613469986,
|
92 |
-
"eval_accuracy": 0.
|
93 |
-
"
|
94 |
-
"
|
95 |
-
"
|
96 |
-
"
|
|
|
|
|
|
|
97 |
"step": 768
|
98 |
}
|
99 |
],
|
@@ -118,7 +145,7 @@
|
|
118 |
"should_evaluate": false,
|
119 |
"should_log": false,
|
120 |
"should_save": true,
|
121 |
-
"should_training_stop":
|
122 |
},
|
123 |
"attributes": {}
|
124 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.991941391941392,
|
3 |
+
"best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597",
|
4 |
"epoch": 8.995607613469986,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 768,
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9538461538461539,
|
14 |
+
"eval_f1": 0.9535883665206972,
|
15 |
+
"eval_loss": 0.11965569853782654,
|
16 |
+
"eval_precision": 0.9535470731605858,
|
17 |
+
"eval_recall": 0.9538461538461539,
|
18 |
+
"eval_runtime": 5.8661,
|
19 |
+
"eval_samples_per_second": 232.691,
|
20 |
+
"eval_steps_per_second": 29.15,
|
21 |
"step": 85
|
22 |
},
|
23 |
{
|
24 |
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9831501831501831,
|
26 |
+
"eval_f1": 0.983143153392684,
|
27 |
+
"eval_loss": 0.060115572065114975,
|
28 |
+
"eval_precision": 0.9831374404084774,
|
29 |
+
"eval_recall": 0.9831501831501831,
|
30 |
+
"eval_runtime": 5.9254,
|
31 |
+
"eval_samples_per_second": 230.365,
|
32 |
+
"eval_steps_per_second": 28.859,
|
33 |
"step": 170
|
34 |
},
|
35 |
{
|
36 |
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9868131868131869,
|
38 |
+
"eval_f1": 0.9868241092241091,
|
39 |
+
"eval_loss": 0.05060575157403946,
|
40 |
+
"eval_precision": 0.9868403029537207,
|
41 |
+
"eval_recall": 0.9868131868131869,
|
42 |
+
"eval_runtime": 5.9299,
|
43 |
+
"eval_samples_per_second": 230.189,
|
44 |
+
"eval_steps_per_second": 28.837,
|
45 |
"step": 256
|
46 |
},
|
47 |
{
|
48 |
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.9860805860805861,
|
50 |
+
"eval_f1": 0.9861535269385863,
|
51 |
+
"eval_loss": 0.04610973969101906,
|
52 |
+
"eval_precision": 0.986445121171901,
|
53 |
+
"eval_recall": 0.9860805860805861,
|
54 |
+
"eval_runtime": 5.9428,
|
55 |
+
"eval_samples_per_second": 229.69,
|
56 |
+
"eval_steps_per_second": 28.774,
|
57 |
"step": 341
|
58 |
},
|
59 |
{
|
60 |
"epoch": 4.989751098096632,
|
61 |
+
"eval_accuracy": 0.989010989010989,
|
62 |
+
"eval_f1": 0.9890246085529585,
|
63 |
+
"eval_loss": 0.0438910573720932,
|
64 |
+
"eval_precision": 0.989050109460552,
|
65 |
+
"eval_recall": 0.989010989010989,
|
66 |
+
"eval_runtime": 5.937,
|
67 |
+
"eval_samples_per_second": 229.913,
|
68 |
+
"eval_steps_per_second": 28.802,
|
69 |
"step": 426
|
70 |
},
|
71 |
{
|
72 |
"epoch": 5.856515373352855,
|
73 |
+
"grad_norm": 0.08060992509126663,
|
74 |
+
"learning_rate": 1.0917042498003083e-05,
|
75 |
+
"loss": 0.0779,
|
76 |
"step": 500
|
77 |
},
|
78 |
{
|
79 |
"epoch": 5.997071742313324,
|
80 |
+
"eval_accuracy": 0.9904761904761905,
|
81 |
+
"eval_f1": 0.9904879940792306,
|
82 |
+
"eval_loss": 0.0396205335855484,
|
83 |
+
"eval_precision": 0.9905117057078526,
|
84 |
+
"eval_recall": 0.9904761904761905,
|
85 |
+
"eval_runtime": 5.9047,
|
86 |
+
"eval_samples_per_second": 231.172,
|
87 |
+
"eval_steps_per_second": 28.96,
|
88 |
"step": 512
|
89 |
},
|
90 |
{
|
91 |
"epoch": 6.992679355783309,
|
92 |
+
"eval_accuracy": 0.991941391941392,
|
93 |
+
"eval_f1": 0.9919447375447602,
|
94 |
+
"eval_loss": 0.035047151148319244,
|
95 |
+
"eval_precision": 0.9919494135494136,
|
96 |
+
"eval_recall": 0.991941391941392,
|
97 |
+
"eval_runtime": 6.0502,
|
98 |
+
"eval_samples_per_second": 225.612,
|
99 |
+
"eval_steps_per_second": 28.264,
|
100 |
"step": 597
|
101 |
},
|
102 |
{
|
103 |
"epoch": 8.0,
|
104 |
+
"eval_accuracy": 0.9912087912087912,
|
105 |
+
"eval_f1": 0.9912160728160728,
|
106 |
+
"eval_loss": 0.03350323066115379,
|
107 |
+
"eval_precision": 0.9912286614059304,
|
108 |
+
"eval_recall": 0.9912087912087912,
|
109 |
+
"eval_runtime": 5.79,
|
110 |
+
"eval_samples_per_second": 235.751,
|
111 |
+
"eval_steps_per_second": 29.534,
|
112 |
"step": 683
|
113 |
},
|
114 |
{
|
115 |
"epoch": 8.995607613469986,
|
116 |
+
"eval_accuracy": 0.9912087912087912,
|
117 |
+
"eval_f1": 0.9912160728160728,
|
118 |
+
"eval_loss": 0.03368490934371948,
|
119 |
+
"eval_precision": 0.9912286614059304,
|
120 |
+
"eval_recall": 0.9912087912087912,
|
121 |
+
"eval_runtime": 5.7784,
|
122 |
+
"eval_samples_per_second": 236.224,
|
123 |
+
"eval_steps_per_second": 29.593,
|
124 |
"step": 768
|
125 |
}
|
126 |
],
|
|
|
145 |
"should_evaluate": false,
|
146 |
"should_log": false,
|
147 |
"should_save": true,
|
148 |
+
"should_training_stop": false
|
149 |
},
|
150 |
"attributes": {}
|
151 |
}
|
checkpoint-768/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
|
3 |
size 5240
|
checkpoint-85/config.json
CHANGED
@@ -55,10 +55,6 @@
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
58 |
-
"label2id": {
|
59 |
-
"crying": 0,
|
60 |
-
"no_crying": 1
|
61 |
-
},
|
62 |
"layer_norm_eps": 1e-05,
|
63 |
"layerdrop": 0.0,
|
64 |
"mask_feature_length": 10,
|
|
|
55 |
},
|
56 |
"initializer_range": 0.02,
|
57 |
"intermediate_size": 3072,
|
|
|
|
|
|
|
|
|
58 |
"layer_norm_eps": 1e-05,
|
59 |
"layerdrop": 0.0,
|
60 |
"mask_feature_length": 10,
|
checkpoint-85/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 94763496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23b104b8e2a8ab0ab3becb4267c1082a46bc58158acb8a209710fb47609d3b4f
|
3 |
size 94763496
|