mandasrinu committed on
Commit
9671df7
1 Parent(s): 58be993

End of training

Browse files
README.md ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: distilbert/distilbert-base-uncased
4
+ tags:
5
+ - generated_from_trainer
6
+ datasets:
7
+ - wnut_17
8
+ model-index:
9
+ - name: my_awesome_wnut_model
10
+ results: []
11
+ ---
12
+
13
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
+ should probably proofread and complete it, then remove this comment. -->
15
+
16
+ # my_awesome_wnut_model
17
+
18
+ This model is a fine-tuned version of [distilbert/distilbert-base-uncased](https://huggingface.co/distilbert/distilbert-base-uncased) on the wnut_17 dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - eval_loss: 0.2751
21
+ - eval_precision: 0.5915
22
+ - eval_recall: 0.2456
23
+ - eval_f1: 0.3471
24
+ - eval_accuracy: 0.9388
25
+ - eval_runtime: 3.0704
26
+ - eval_samples_per_second: 419.16
27
+ - eval_steps_per_second: 26.381
28
+ - epoch: 1.0
29
+ - step: 213
30
+
31
+ ## Model description
32
+
33
+ More information needed
34
+
35
+ ## Intended uses & limitations
36
+
37
+ More information needed
38
+
39
+ ## Training and evaluation data
40
+
41
+ More information needed
42
+
43
+ ## Training procedure
44
+
45
+ ### Training hyperparameters
46
+
47
+ The following hyperparameters were used during training:
48
+ - learning_rate: 2e-05
49
+ - train_batch_size: 16
50
+ - eval_batch_size: 16
51
+ - seed: 42
52
+ - distributed_type: multi-GPU
53
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
54
+ - lr_scheduler_type: linear
55
+ - num_epochs: 2
56
+
57
+ ### Framework versions
58
+
59
+ - Transformers 4.36.1
60
+ - Pytorch 2.0.1+cu118
61
+ - Datasets 2.15.0
62
+ - Tokenizers 0.15.0
config.json ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert/distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForTokenClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "O",
13
+ "1": "B-corporation",
14
+ "2": "I-corporation",
15
+ "3": "B-creative-work",
16
+ "4": "I-creative-work",
17
+ "5": "B-group",
18
+ "6": "I-group",
19
+ "7": "B-location",
20
+ "8": "I-location",
21
+ "9": "B-person",
22
+ "10": "I-person",
23
+ "11": "B-product",
24
+ "12": "I-product"
25
+ },
26
+ "initializer_range": 0.02,
27
+ "label2id": {
28
+ "B-corporation": 1,
29
+ "B-creative-work": 3,
30
+ "B-group": 5,
31
+ "B-location": 7,
32
+ "B-person": 9,
33
+ "B-product": 11,
34
+ "I-corporation": 2,
35
+ "I-creative-work": 4,
36
+ "I-group": 6,
37
+ "I-location": 8,
38
+ "I-person": 10,
39
+ "I-product": 12,
40
+ "O": 0
41
+ },
42
+ "max_position_embeddings": 512,
43
+ "model_type": "distilbert",
44
+ "n_heads": 12,
45
+ "n_layers": 6,
46
+ "pad_token_id": 0,
47
+ "qa_dropout": 0.1,
48
+ "seq_classif_dropout": 0.2,
49
+ "sinusoidal_pos_embds": false,
50
+ "tie_weights_": true,
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.36.1",
53
+ "vocab_size": 30522
54
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee418a99cf49d73de221ccd8ab39c5308f96bd018df899ea561aeba1ecbbe7fb
3
+ size 265503852
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tmp-checkpoint-213/config.json ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert/distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForTokenClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "O",
13
+ "1": "B-corporation",
14
+ "2": "I-corporation",
15
+ "3": "B-creative-work",
16
+ "4": "I-creative-work",
17
+ "5": "B-group",
18
+ "6": "I-group",
19
+ "7": "B-location",
20
+ "8": "I-location",
21
+ "9": "B-person",
22
+ "10": "I-person",
23
+ "11": "B-product",
24
+ "12": "I-product"
25
+ },
26
+ "initializer_range": 0.02,
27
+ "label2id": {
28
+ "B-corporation": 1,
29
+ "B-creative-work": 3,
30
+ "B-group": 5,
31
+ "B-location": 7,
32
+ "B-person": 9,
33
+ "B-product": 11,
34
+ "I-corporation": 2,
35
+ "I-creative-work": 4,
36
+ "I-group": 6,
37
+ "I-location": 8,
38
+ "I-person": 10,
39
+ "I-product": 12,
40
+ "O": 0
41
+ },
42
+ "max_position_embeddings": 512,
43
+ "model_type": "distilbert",
44
+ "n_heads": 12,
45
+ "n_layers": 6,
46
+ "pad_token_id": 0,
47
+ "qa_dropout": 0.1,
48
+ "seq_classif_dropout": 0.2,
49
+ "sinusoidal_pos_embds": false,
50
+ "tie_weights_": true,
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.36.1",
53
+ "vocab_size": 30522
54
+ }
tmp-checkpoint-213/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee418a99cf49d73de221ccd8ab39c5308f96bd018df899ea561aeba1ecbbe7fb
3
+ size 265503852
tmp-checkpoint-213/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tmp-checkpoint-213/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tmp-checkpoint-213/tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "mask_token": "[MASK]",
48
+ "model_max_length": 1000000000000000019884624838656,
49
+ "pad_token": "[PAD]",
50
+ "sep_token": "[SEP]",
51
+ "strip_accents": null,
52
+ "tokenize_chinese_chars": true,
53
+ "tokenizer_class": "DistilBertTokenizer",
54
+ "unk_token": "[UNK]"
55
+ }
tmp-checkpoint-213/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96e8df02779413171f5114feb2c484d9c0270af9d38c0b2cad04c0ccf928d4f1
3
+ size 4283
tmp-checkpoint-213/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "mask_token": "[MASK]",
48
+ "model_max_length": 1000000000000000019884624838656,
49
+ "pad_token": "[PAD]",
50
+ "sep_token": "[SEP]",
51
+ "strip_accents": null,
52
+ "tokenize_chinese_chars": true,
53
+ "tokenizer_class": "DistilBertTokenizer",
54
+ "unk_token": "[UNK]"
55
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96e8df02779413171f5114feb2c484d9c0270af9d38c0b2cad04c0ccf928d4f1
3
+ size 4283
vocab.txt ADDED
The diff for this file is too large to render. See raw diff