Pablo94 committed on
Commit
826cfe1
1 Parent(s): d3bb0c8

Training in progress, epoch 1

Browse files
README.md ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ base_model: xlm-roberta-base
4
+ tags:
5
+ - generated_from_trainer
6
+ metrics:
7
+ - accuracy
8
+ - precision
9
+ - recall
10
+ model-index:
11
+ - name: xlm-roberta-base-finetuned-detests-wandb24
12
+ results: []
13
+ ---
14
+
15
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
+ should probably proofread and complete it, then remove this comment. -->
17
+
18
+ # xlm-roberta-base-finetuned-detests-wandb24
19
+
20
+ This model is a fine-tuned version of [xlm-roberta-base](https://huggingface.co/xlm-roberta-base) on an unspecified dataset.
21
+ It achieves the following results on the evaluation set:
22
+ - Loss: 0.4371
23
+ - Accuracy: 0.7938
24
+ - F1-score: 0.7241
25
+ - Precision: 0.7136
26
+ - Recall: 0.7396
27
+ - Auc: 0.7396
28
+
29
+ ## Model description
30
+
31
+ More information needed
32
+
33
+ ## Intended uses & limitations
34
+
35
+ More information needed
36
+
37
+ ## Training and evaluation data
38
+
39
+ More information needed
40
+
41
+ ## Training procedure
42
+
43
+ ### Training hyperparameters
44
+
45
+ The following hyperparameters were used during training:
46
+ - learning_rate: 5e-05
47
+ - train_batch_size: 16
48
+ - eval_batch_size: 16
49
+ - seed: 42
50
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
51
+ - lr_scheduler_type: linear
52
+ - num_epochs: 2
53
+
54
+ ### Training results
55
+
56
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1-score | Precision | Recall | Auc |
57
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:--------:|:---------:|:------:|:------:|
58
+ | 0.458 | 1.0 | 153 | 0.4512 | 0.7725 | 0.4358 | 0.3863 | 0.5 | 0.5 |
59
+ | 0.4262 | 2.0 | 306 | 0.4371 | 0.7938 | 0.7241 | 0.7136 | 0.7396 | 0.7396 |
60
+
61
+
62
+ ### Framework versions
63
+
64
+ - Transformers 4.37.2
65
+ - Pytorch 2.1.0+cu121
66
+ - Datasets 2.17.0
67
+ - Tokenizers 0.15.1
added_tokens.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "@usuario": 31002,
3
+ "emoji": 31005,
4
+ "hashtag": 31004,
5
+ "url": 31003
6
+ }
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "finiteautomata/beto-sentiment-analysis",
3
+ "architectures": [
4
+ "BertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "bert",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "output_past": true,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "problem_type": "single_label_classification",
23
+ "torch_dtype": "float32",
24
+ "transformers_version": "4.37.2",
25
+ "type_vocab_size": 2,
26
+ "use_cache": true,
27
+ "vocab_size": 31006
28
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:560de303b35b30b7d2b03c5cfa4e6492dba58ffe136838d84325966e23a4e340
3
+ size 439445496
runs/Feb12_09-39-40_93f51a08e000/events.out.tfevents.1707730980.93f51a08e000.1197.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29e970fcaa23ba6488b071bda1f199569abf6140cb145bbc03cb1d64fa21d0bc
3
+ size 7049
runs/Feb12_09-48-09_93f51a08e000/events.out.tfevents.1707731299.93f51a08e000.1197.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccb3aa453258cabb6f8fc87ccff9813ae003ee2066763ac5fdb8595d0ba11f74
3
+ size 7099
runs/Feb12_09-52-39_93f51a08e000/events.out.tfevents.1707731565.93f51a08e000.1197.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13b21529e804a993e9128799476e28f9f5b9d862cd1da89cde3d95a066f3e9f0
3
+ size 7026
runs/Feb12_09-57-03_93f51a08e000/events.out.tfevents.1707731829.93f51a08e000.1197.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e94493558f1ef8006fd3dcd25367220f38ba6b4b82e4dca7200d736eb9f01f3
3
+ size 7099
runs/Feb12_10-02-09_93f51a08e000/events.out.tfevents.1707732135.93f51a08e000.1197.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1797a15649ac7456a4cc9448d9d174e1e0cf5900ffdd63f1bd819c33a964e53
3
+ size 7049
runs/Feb12_10-06-36_93f51a08e000/events.out.tfevents.1707732411.93f51a08e000.1197.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cac9fc0cea880fe529e712c64cb99c5c05eb90c4011eebf2e4536e6c1d797c5
3
+ size 7055
runs/Feb12_10-15-15_93f51a08e000/events.out.tfevents.1707732920.93f51a08e000.1197.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbfa6a168f0fd8b786bc799a646063315b96e8528c40fc8d1ca3aae720c82860
3
+ size 6375
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
3
+ size 5069051
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[MASK]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "[PAD]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "3": {
20
+ "content": "[UNK]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "4": {
28
+ "content": "[CLS]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "5": {
36
+ "content": "[SEP]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "31002": {
44
+ "content": "@usuario",
45
+ "lstrip": false,
46
+ "normalized": true,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": false
50
+ },
51
+ "31003": {
52
+ "content": "url",
53
+ "lstrip": false,
54
+ "normalized": true,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": false
58
+ },
59
+ "31004": {
60
+ "content": "hashtag",
61
+ "lstrip": false,
62
+ "normalized": true,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": false
66
+ },
67
+ "31005": {
68
+ "content": "emoji",
69
+ "lstrip": false,
70
+ "normalized": true,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": false
74
+ }
75
+ },
76
+ "clean_up_tokenization_spaces": true,
77
+ "cls_token": "[CLS]",
78
+ "do_basic_tokenize": true,
79
+ "do_lower_case": false,
80
+ "mask_token": "[MASK]",
81
+ "max_length": 128,
82
+ "model_max_length": 512,
83
+ "never_split": null,
84
+ "pad_token": "[PAD]",
85
+ "sep_token": "[SEP]",
86
+ "stride": 0,
87
+ "strip_accents": false,
88
+ "tokenize_chinese_chars": true,
89
+ "tokenizer_class": "BertTokenizer",
90
+ "truncation_side": "right",
91
+ "truncation_strategy": "longest_first",
92
+ "unk_token": "[UNK]"
93
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef7e15e5fc18349d3871ab6e2436ca32b9e187d7656ed9621c41bb156385ec5c
3
+ size 4728
vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
vocab.txt ADDED
The diff for this file is too large to render. See raw diff