End of training

Browse files

Files changed (9) hide show

.gitattributes +1 -0
README.md +165 -0
config.json +37 -0
model.safetensors +3 -0
sentencepiece.bpe.model +3 -0
special_tokens_map.json +15 -0
tokenizer.json +3 -0
tokenizer_config.json +55 -0
training_args.bin +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,165 @@

+---
+license: mit
+base_model: microsoft/Multilingual-MiniLM-L12-H384
+tags:
+- generated_from_trainer
+metrics:
+- precision
+- recall
+- f1
+- accuracy
+model-index:
+- name: ner-coin-v2
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# ner-coin-v2
+This model is a fine-tuned version of [microsoft/Multilingual-MiniLM-L12-H384](https://huggingface.co/microsoft/Multilingual-MiniLM-L12-H384) on an unspecified dataset (no dataset name was recorded by the Trainer).
+It achieves the following results on the evaluation set:
+- Loss: 0.0182
+- Precision: 0.9837
+- Recall: 0.9947
+- F1: 0.9892
+- Accuracy: 0.9971
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 5e-05
+- train_batch_size: 64
+- eval_batch_size: 64
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- num_epochs: 100
+### Training results
+| Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy |
+|:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
+| No log        | 1.0   | 51   | 0.2140          | 0.7507    | 0.8582 | 0.8008 | 0.9790   |
+| No log        | 2.0   | 102  | 0.1401          | 0.9631    | 0.9790 | 0.9710 | 0.9936   |
+| No log        | 3.0   | 153  | 0.1071          | 0.9710    | 0.9790 | 0.9750 | 0.9945   |
+| No log        | 4.0   | 204  | 0.0852          | 0.9676    | 0.9857 | 0.9766 | 0.9948   |
+| No log        | 5.0   | 255  | 0.0712          | 0.9741    | 0.9880 | 0.9810 | 0.9953   |
+| No log        | 6.0   | 306  | 0.0586          | 0.9842    | 0.9820 | 0.9831 | 0.9962   |
+| No log        | 7.0   | 357  | 0.0514          | 0.9799    | 0.9865 | 0.9832 | 0.9960   |
+| No log        | 8.0   | 408  | 0.0472          | 0.9778    | 0.9895 | 0.9836 | 0.9957   |
+| No log        | 9.0   | 459  | 0.0428          | 0.9749    | 0.9895 | 0.9821 | 0.9956   |
+| 0.1133        | 10.0  | 510  | 0.0393          | 0.9864    | 0.9782 | 0.9823 | 0.9956   |
+| 0.1133        | 11.0  | 561  | 0.0342          | 0.9828    | 0.9857 | 0.9843 | 0.9959   |
+| 0.1133        | 12.0  | 612  | 0.0307          | 0.9806    | 0.9880 | 0.9843 | 0.9964   |
+| 0.1133        | 13.0  | 663  | 0.0302          | 0.9748    | 0.9880 | 0.9814 | 0.9956   |
+| 0.1133        | 14.0  | 714  | 0.0295          | 0.9677    | 0.9895 | 0.9785 | 0.9948   |
+| 0.1133        | 15.0  | 765  | 0.0256          | 0.9828    | 0.9872 | 0.9850 | 0.9964   |
+| 0.1133        | 16.0  | 816  | 0.0295          | 0.9601    | 0.9932 | 0.9764 | 0.9939   |
+| 0.1133        | 17.0  | 867  | 0.0252          | 0.9784    | 0.9865 | 0.9824 | 0.9958   |
+| 0.1133        | 18.0  | 918  | 0.0289          | 0.9819    | 0.9775 | 0.9797 | 0.9948   |
+| 0.1133        | 19.0  | 969  | 0.0248          | 0.9798    | 0.9842 | 0.9820 | 0.9954   |
+| 0.0217        | 20.0  | 1020 | 0.0254          | 0.9741    | 0.9880 | 0.9810 | 0.9950   |
+| 0.0217        | 21.0  | 1071 | 0.0219          | 0.9749    | 0.9902 | 0.9825 | 0.9956   |
+| 0.0217        | 22.0  | 1122 | 0.0240          | 0.9770    | 0.9887 | 0.9828 | 0.9955   |
+| 0.0217        | 23.0  | 1173 | 0.0226          | 0.9807    | 0.9887 | 0.9847 | 0.9958   |
+| 0.0217        | 24.0  | 1224 | 0.0209          | 0.9756    | 0.9910 | 0.9833 | 0.9957   |
+| 0.0217        | 25.0  | 1275 | 0.0203          | 0.9822    | 0.9917 | 0.9869 | 0.9963   |
+| 0.0217        | 26.0  | 1326 | 0.0231          | 0.9727    | 0.9902 | 0.9814 | 0.9950   |
+| 0.0217        | 27.0  | 1377 | 0.0204          | 0.9778    | 0.9895 | 0.9836 | 0.9958   |
+| 0.0217        | 28.0  | 1428 | 0.0196          | 0.9771    | 0.9917 | 0.9844 | 0.9962   |
+| 0.0217        | 29.0  | 1479 | 0.0206          | 0.9757    | 0.9932 | 0.9844 | 0.9957   |
+| 0.0097        | 30.0  | 1530 | 0.0217          | 0.9757    | 0.9955 | 0.9855 | 0.9959   |
+| 0.0097        | 31.0  | 1581 | 0.0192          | 0.9843    | 0.9872 | 0.9858 | 0.9962   |
+| 0.0097        | 32.0  | 1632 | 0.0189          | 0.9844    | 0.9910 | 0.9877 | 0.9964   |
+| 0.0097        | 33.0  | 1683 | 0.0174          | 0.9844    | 0.9925 | 0.9884 | 0.9966   |
+| 0.0097        | 34.0  | 1734 | 0.0183          | 0.9836    | 0.9910 | 0.9873 | 0.9966   |
+| 0.0097        | 35.0  | 1785 | 0.0189          | 0.9785    | 0.9917 | 0.9851 | 0.9964   |
+| 0.0097        | 36.0  | 1836 | 0.0202          | 0.9757    | 0.9940 | 0.9848 | 0.9960   |
+| 0.0097        | 37.0  | 1887 | 0.0203          | 0.9770    | 0.9880 | 0.9825 | 0.9957   |
+| 0.0097        | 38.0  | 1938 | 0.0189          | 0.9778    | 0.9932 | 0.9855 | 0.9962   |
+| 0.0097        | 39.0  | 1989 | 0.0169          | 0.9836    | 0.9895 | 0.9865 | 0.9966   |
+| 0.0055        | 40.0  | 2040 | 0.0183          | 0.9778    | 0.9917 | 0.9847 | 0.9961   |
+| 0.0055        | 41.0  | 2091 | 0.0159          | 0.9866    | 0.9910 | 0.9888 | 0.9968   |
+| 0.0055        | 42.0  | 2142 | 0.0175          | 0.9778    | 0.9917 | 0.9847 | 0.9962   |
+| 0.0055        | 43.0  | 2193 | 0.0153          | 0.9829    | 0.9940 | 0.9884 | 0.9969   |
+| 0.0055        | 44.0  | 2244 | 0.0170          | 0.9778    | 0.9925 | 0.9851 | 0.9963   |
+| 0.0055        | 45.0  | 2295 | 0.0184          | 0.9750    | 0.9940 | 0.9844 | 0.9962   |
+| 0.0055        | 46.0  | 2346 | 0.0172          | 0.9786    | 0.9940 | 0.9862 | 0.9964   |
+| 0.0055        | 47.0  | 2397 | 0.0174          | 0.9779    | 0.9947 | 0.9862 | 0.9965   |
+| 0.0055        | 48.0  | 2448 | 0.0169          | 0.9778    | 0.9910 | 0.9844 | 0.9962   |
+| 0.0055        | 49.0  | 2499 | 0.0193          | 0.9701    | 0.9962 | 0.9830 | 0.9958   |
+| 0.0035        | 50.0  | 2550 | 0.0163          | 0.9792    | 0.9910 | 0.9851 | 0.9963   |
+| 0.0035        | 51.0  | 2601 | 0.0173          | 0.9771    | 0.9925 | 0.9847 | 0.9960   |
+| 0.0035        | 52.0  | 2652 | 0.0164          | 0.9829    | 0.9932 | 0.9881 | 0.9966   |
+| 0.0035        | 53.0  | 2703 | 0.0177          | 0.9757    | 0.9955 | 0.9855 | 0.9961   |
+| 0.0035        | 54.0  | 2754 | 0.0164          | 0.9815    | 0.9932 | 0.9873 | 0.9965   |
+| 0.0035        | 55.0  | 2805 | 0.0171          | 0.9793    | 0.9947 | 0.9870 | 0.9966   |
+| 0.0035        | 56.0  | 2856 | 0.0175          | 0.9800    | 0.9925 | 0.9862 | 0.9966   |
+| 0.0035        | 57.0  | 2907 | 0.0167          | 0.9801    | 0.9955 | 0.9877 | 0.9966   |
+| 0.0035        | 58.0  | 2958 | 0.0168          | 0.9880    | 0.9887 | 0.9884 | 0.9966   |
+| 0.0025        | 59.0  | 3009 | 0.0174          | 0.9858    | 0.9917 | 0.9888 | 0.9969   |
+| 0.0025        | 60.0  | 3060 | 0.0153          | 0.9837    | 0.9940 | 0.9888 | 0.9970   |
+| 0.0025        | 61.0  | 3111 | 0.0165          | 0.9829    | 0.9932 | 0.9881 | 0.9968   |
+| 0.0025        | 62.0  | 3162 | 0.0150          | 0.9881    | 0.9925 | 0.9903 | 0.9971   |
+| 0.0025        | 63.0  | 3213 | 0.0156          | 0.9851    | 0.9947 | 0.9899 | 0.9972   |
+| 0.0025        | 64.0  | 3264 | 0.0147          | 0.9873    | 0.9940 | 0.9907 | 0.9974   |
+| 0.0025        | 65.0  | 3315 | 0.0169          | 0.9815    | 0.9947 | 0.9881 | 0.9967   |
+| 0.0025        | 66.0  | 3366 | 0.0186          | 0.9786    | 0.9962 | 0.9874 | 0.9964   |
+| 0.0025        | 67.0  | 3417 | 0.0171          | 0.9815    | 0.9940 | 0.9877 | 0.9967   |
+| 0.0025        | 68.0  | 3468 | 0.0164          | 0.9822    | 0.9932 | 0.9877 | 0.9966   |
+| 0.0021        | 69.0  | 3519 | 0.0161          | 0.9829    | 0.9932 | 0.9881 | 0.9968   |
+| 0.0021        | 70.0  | 3570 | 0.0156          | 0.9858    | 0.9925 | 0.9892 | 0.9970   |
+| 0.0021        | 71.0  | 3621 | 0.0163          | 0.9815    | 0.9947 | 0.9881 | 0.9967   |
+| 0.0021        | 72.0  | 3672 | 0.0166          | 0.9837    | 0.9947 | 0.9892 | 0.9970   |
+| 0.0021        | 73.0  | 3723 | 0.0161          | 0.9866    | 0.9925 | 0.9895 | 0.9970   |
+| 0.0021        | 74.0  | 3774 | 0.0165          | 0.9837    | 0.9947 | 0.9892 | 0.9970   |
+| 0.0021        | 75.0  | 3825 | 0.0165          | 0.9859    | 0.9947 | 0.9903 | 0.9972   |
+| 0.0021        | 76.0  | 3876 | 0.0170          | 0.9830    | 0.9947 | 0.9888 | 0.9969   |
+| 0.0021        | 77.0  | 3927 | 0.0171          | 0.9844    | 0.9947 | 0.9896 | 0.9971   |
+| 0.0021        | 78.0  | 3978 | 0.0179          | 0.9815    | 0.9947 | 0.9881 | 0.9967   |
+| 0.0016        | 79.0  | 4029 | 0.0170          | 0.9851    | 0.9947 | 0.9899 | 0.9971   |
+| 0.0016        | 80.0  | 4080 | 0.0170          | 0.9851    | 0.9947 | 0.9899 | 0.9971   |
+| 0.0016        | 81.0  | 4131 | 0.0186          | 0.9779    | 0.9955 | 0.9866 | 0.9963   |
+| 0.0016        | 82.0  | 4182 | 0.0179          | 0.9822    | 0.9947 | 0.9884 | 0.9968   |
+| 0.0016        | 83.0  | 4233 | 0.0177          | 0.9822    | 0.9947 | 0.9884 | 0.9968   |
+| 0.0016        | 84.0  | 4284 | 0.0177          | 0.9822    | 0.9947 | 0.9884 | 0.9968   |
+| 0.0016        | 85.0  | 4335 | 0.0176          | 0.9830    | 0.9947 | 0.9888 | 0.9969   |
+| 0.0016        | 86.0  | 4386 | 0.0182          | 0.9822    | 0.9947 | 0.9884 | 0.9968   |
+| 0.0016        | 87.0  | 4437 | 0.0173          | 0.9851    | 0.9947 | 0.9899 | 0.9971   |
+| 0.0016        | 88.0  | 4488 | 0.0179          | 0.9808    | 0.9947 | 0.9877 | 0.9966   |
+| 0.0015        | 89.0  | 4539 | 0.0176          | 0.9837    | 0.9947 | 0.9892 | 0.9970   |
+| 0.0015        | 90.0  | 4590 | 0.0181          | 0.9837    | 0.9947 | 0.9892 | 0.9970   |
+| 0.0015        | 91.0  | 4641 | 0.0183          | 0.9837    | 0.9947 | 0.9892 | 0.9970   |
+| 0.0015        | 92.0  | 4692 | 0.0183          | 0.9844    | 0.9947 | 0.9896 | 0.9971   |
+| 0.0015        | 93.0  | 4743 | 0.0188          | 0.9837    | 0.9947 | 0.9892 | 0.9969   |
+| 0.0015        | 94.0  | 4794 | 0.0189          | 0.9837    | 0.9947 | 0.9892 | 0.9969   |
+| 0.0015        | 95.0  | 4845 | 0.0186          | 0.9837    | 0.9947 | 0.9892 | 0.9969   |
+| 0.0015        | 96.0  | 4896 | 0.0180          | 0.9837    | 0.9947 | 0.9892 | 0.9971   |
+| 0.0015        | 97.0  | 4947 | 0.0181          | 0.9837    | 0.9947 | 0.9892 | 0.9970   |
+| 0.0015        | 98.0  | 4998 | 0.0182          | 0.9837    | 0.9947 | 0.9892 | 0.9970   |
+| 0.0013        | 99.0  | 5049 | 0.0182          | 0.9837    | 0.9947 | 0.9892 | 0.9971   |
+| 0.0013        | 100.0 | 5100 | 0.0182          | 0.9837    | 0.9947 | 0.9892 | 0.9971   |
+### Framework versions
+- Transformers 4.40.2
+- Pytorch 2.1.0+cu121
+- Datasets 2.14.5
+- Tokenizers 0.19.1

config.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "_name_or_path": "microsoft/Multilingual-MiniLM-L12-H384",
+  "architectures": [
+    "BertForTokenClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "finetuning_task": "ner",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 384,
+  "id2label": {
+    "0": "O",
+    "1": "I-COIN",
+    "2": "B-COIN"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 1536,
+  "label2id": {
+    "B-COIN": 2,
+    "I-COIN": 1,
+    "O": 0
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 250037
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d90635090e7911c6a2e8b17fe84ca3844218f50d85ecc9fdc2c6fc577e523799
+size 470051652

sentencepiece.bpe.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "unk_token": "<unk>"
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b74659c780d49afad7a7b9799868f75cbd3014fb6c34956e85a793028d38094a
+size 17098251

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250001": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": "<mask>",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:79a5d9d371236acdd673b0daf320aadfc499dd5615060dfefde91cfe7d33e2e0
+size 4984