toghrultahirov committed on
Commit
ba87c00
1 Parent(s): ca72978

Training complete

Browse files
README.md CHANGED
@@ -20,11 +20,11 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  This model is a fine-tuned version of [google-bert/bert-base-multilingual-cased](https://huggingface.co/google-bert/bert-base-multilingual-cased) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 0.1283
24
- - Precision: 0.8888
25
- - Recall: 0.9033
26
- - F1: 0.8960
27
- - Accuracy: 0.9656
28
 
29
  ## Model description
30
 
@@ -44,22 +44,32 @@ More information needed
44
 
45
  The following hyperparameters were used during training:
46
  - learning_rate: 3e-05
47
- - train_batch_size: 64
48
- - eval_batch_size: 64
49
  - seed: 42
50
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
51
  - lr_scheduler_type: reduce_lr_on_plateau
52
- - num_epochs: 5
53
 
54
  ### Training results
55
 
56
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
57
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
58
- | No log | 1.0 | 157 | 0.1525 | 0.8593 | 0.8675 | 0.8634 | 0.9550 |
59
- | No log | 2.0 | 314 | 0.1343 | 0.8706 | 0.9106 | 0.8902 | 0.9620 |
60
- | No log | 3.0 | 471 | 0.1283 | 0.8888 | 0.9033 | 0.8960 | 0.9656 |
61
- | 0.1657 | 4.0 | 628 | 0.1483 | 0.8703 | 0.9145 | 0.8918 | 0.9621 |
62
- | 0.1657 | 5.0 | 785 | 0.1563 | 0.8742 | 0.9141 | 0.8937 | 0.9644 |
 
 
 
 
 
 
 
 
 
 
63
 
64
 
65
  ### Framework versions
 
20
 
21
  This model is a fine-tuned version of [google-bert/bert-base-multilingual-cased](https://huggingface.co/google-bert/bert-base-multilingual-cased) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 0.1319
24
+ - Precision: 0.8726
25
+ - Recall: 0.9026
26
+ - F1: 0.8874
27
+ - Accuracy: 0.9619
28
 
29
  ## Model description
30
 
 
44
 
45
  The following hyperparameters were used during training:
46
  - learning_rate: 3e-05
47
+ - train_batch_size: 32
48
+ - eval_batch_size: 32
49
  - seed: 42
50
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
51
  - lr_scheduler_type: reduce_lr_on_plateau
52
+ - num_epochs: 15
53
 
54
  ### Training results
55
 
56
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
57
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
58
+ | No log | 1.0 | 313 | 0.1464 | 0.8797 | 0.8615 | 0.8705 | 0.9587 |
59
+ | 0.2128 | 2.0 | 626 | 0.1319 | 0.8726 | 0.9026 | 0.8874 | 0.9619 |
60
+ | 0.2128 | 3.0 | 939 | 0.1461 | 0.8689 | 0.8924 | 0.8805 | 0.9596 |
61
+ | 0.0783 | 4.0 | 1252 | 0.1529 | 0.8837 | 0.9049 | 0.8942 | 0.9620 |
62
+ | 0.0443 | 5.0 | 1565 | 0.1921 | 0.8657 | 0.9157 | 0.8900 | 0.9615 |
63
+ | 0.0443 | 6.0 | 1878 | 0.1647 | 0.8975 | 0.9224 | 0.9098 | 0.9685 |
64
+ | 0.0201 | 7.0 | 2191 | 0.1725 | 0.8904 | 0.9183 | 0.9041 | 0.9674 |
65
+ | 0.0098 | 8.0 | 2504 | 0.1766 | 0.8917 | 0.9199 | 0.9056 | 0.9682 |
66
+ | 0.0098 | 9.0 | 2817 | 0.1756 | 0.8926 | 0.9202 | 0.9062 | 0.9686 |
67
+ | 0.007 | 10.0 | 3130 | 0.1763 | 0.8916 | 0.9189 | 0.9051 | 0.9684 |
68
+ | 0.007 | 11.0 | 3443 | 0.1772 | 0.8907 | 0.9183 | 0.9043 | 0.9682 |
69
+ | 0.007 | 12.0 | 3756 | 0.1773 | 0.8895 | 0.9173 | 0.9032 | 0.9680 |
70
+ | 0.0067 | 13.0 | 4069 | 0.1775 | 0.8892 | 0.9170 | 0.9029 | 0.9680 |
71
+ | 0.0067 | 14.0 | 4382 | 0.1775 | 0.8897 | 0.9170 | 0.9032 | 0.9679 |
72
+ | 0.0062 | 15.0 | 4695 | 0.1775 | 0.8897 | 0.9170 | 0.9032 | 0.9679 |
73
 
74
 
75
  ### Framework versions
config.json CHANGED
@@ -11,22 +11,22 @@
11
  "hidden_size": 768,
12
  "id2label": {
13
  "0": "O",
14
- "1": "B-PER",
15
- "2": "I-PER",
16
  "3": "B-LOC",
17
  "4": "I-LOC",
18
- "5": "B-ORG",
19
- "6": "I-ORG"
20
  },
21
  "initializer_range": 0.02,
22
  "intermediate_size": 3072,
23
  "label2id": {
24
  "B-LOC": 3,
25
- "B-ORG": 5,
26
- "B-PER": 1,
27
  "I-LOC": 4,
28
- "I-ORG": 6,
29
- "I-PER": 2,
30
  "O": 0
31
  },
32
  "layer_norm_eps": 1e-12,
@@ -42,7 +42,7 @@
42
  "pooler_type": "first_token_transform",
43
  "position_embedding_type": "absolute",
44
  "torch_dtype": "float32",
45
- "transformers_version": "4.40.2",
46
  "type_vocab_size": 2,
47
  "use_cache": true,
48
  "vocab_size": 119547
 
11
  "hidden_size": 768,
12
  "id2label": {
13
  "0": "O",
14
+ "1": "B-ORG",
15
+ "2": "I-ORG",
16
  "3": "B-LOC",
17
  "4": "I-LOC",
18
+ "5": "B-PER",
19
+ "6": "I-PER"
20
  },
21
  "initializer_range": 0.02,
22
  "intermediate_size": 3072,
23
  "label2id": {
24
  "B-LOC": 3,
25
+ "B-ORG": 1,
26
+ "B-PER": 5,
27
  "I-LOC": 4,
28
+ "I-ORG": 2,
29
+ "I-PER": 6,
30
  "O": 0
31
  },
32
  "layer_norm_eps": 1e-12,
 
42
  "pooler_type": "first_token_transform",
43
  "position_embedding_type": "absolute",
44
  "torch_dtype": "float32",
45
+ "transformers_version": "4.41.0",
46
  "type_vocab_size": 2,
47
  "use_cache": true,
48
  "vocab_size": 119547
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4e185154dc8f18bc11da79db5384fecba22e9db276e215a7d8c94e9599d11e9
3
  size 709096284
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42150f376fc5de08f0b0ea7b48f3e1c6c0ddf35f5edf41722d97ebc6ba55de9b
3
  size 709096284
runs/May23_15-45-38_9d80cb969c0a/events.out.tfevents.1716480282.9d80cb969c0a.20961.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfe19decf16cfb62f8fa8fa27cacafcd5d3bba683220218198a9273dfa5ea788
3
+ size 560
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ffe3a8c9513ba194945196091f9c43e359ea408a82468c1cd63dc6aa033b484
3
- size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec6bead204e8da5a4f809eeb3956d4188275a564f78ba274faaadeaf7b8730a6
3
+ size 5176