Training in progress, step 500

Browse files

Files changed (5) hide show

README.md +14 -17
config.json +1 -31
model.safetensors +2 -2
runs/Oct10_01-15-06_aura.fi.muni.cz/events.out.tfevents.1728515711.aura.fi.muni.cz.2703744.0 +3 -0
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -20,12 +20,11 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [zhihan1996/DNA_bert_6](https://huggingface.co/zhihan1996/DNA_bert_6) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.9545
-- Accuracy: 0.6326
-- Precision: 0.7326
-- Recall: 0.7248
-- F1: 0.7187
-- Mcc: 0.6857
 ## Model description
@@ -54,17 +53,15 @@ The following hyperparameters were used during training:
 ### Training results
-| Training Loss | Epoch  | Step | Validation Loss | Accuracy | Precision | Recall | F1     | Mcc    |
-|:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|:------:|
-| 1.7375        | 0.4209 | 500  | 1.4156          | 0.3771   | 0.5528    | 0.5586 | 0.5239 | 0.4908 |
-| 1.334         | 0.8418 | 1000 | 1.2193          | 0.5040   | 0.6174    | 0.6212 | 0.6143 | 0.5661 |
-| 1.1545        | 1.2626 | 1500 | 1.1257          | 0.5406   | 0.6592    | 0.6543 | 0.6508 | 0.6037 |
-| 1.042         | 1.6835 | 2000 | 1.0398          | 0.5683   | 0.6838    | 0.6864 | 0.6739 | 0.6394 |
-| 0.9394        | 2.1044 | 2500 | 1.0141          | 0.5835   | 0.6974    | 0.6890 | 0.6809 | 0.6437 |
-| 0.8279        | 2.5253 | 3000 | 0.9895          | 0.6022   | 0.7070    | 0.7020 | 0.6934 | 0.6585 |
-| 0.8023        | 2.9461 | 3500 | 0.9273          | 0.6349   | 0.7246    | 0.7240 | 0.7189 | 0.6838 |
-| 0.6899        | 3.3670 | 4000 | 0.9374          | 0.6328   | 0.7272    | 0.7247 | 0.7194 | 0.6849 |
-| 0.6672        | 3.7879 | 4500 | 0.9545          | 0.6326   | 0.7326    | 0.7248 | 0.7187 | 0.6857 |
 ### Framework versions

 This model is a fine-tuned version of [zhihan1996/DNA_bert_6](https://huggingface.co/zhihan1996/DNA_bert_6) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.3621
+- Accuracy: 0.8538
+- Precision: 0.8812
+- Recall: 0.8210
+- F1: 0.8500
 ## Model description
 ### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Accuracy | Precision | Recall | F1     |
+|:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
+| 0.5241        | 0.3946 | 500  | 0.4448          | 0.7869   | 0.8057    | 0.7614 | 0.7829 |
+| 0.4126        | 0.7893 | 1000 | 0.3896          | 0.8129   | 0.8379    | 0.7802 | 0.8080 |
+| 0.3527        | 1.1839 | 1500 | 0.3613          | 0.8367   | 0.8267    | 0.8558 | 0.8410 |
+| 0.3209        | 1.5785 | 2000 | 0.3744          | 0.8322   | 0.8702    | 0.7846 | 0.8252 |
+| 0.3075        | 1.9732 | 2500 | 0.3244          | 0.8545   | 0.8673    | 0.8403 | 0.8535 |
+| 0.2526        | 2.3678 | 3000 | 0.3407          | 0.8539   | 0.8595    | 0.8495 | 0.8544 |
+| 0.2512        | 2.7624 | 3500 | 0.3621          | 0.8538   | 0.8812    | 0.8210 | 0.8500 |
 ### Framework versions

config.json CHANGED Viewed

@@ -17,38 +17,8 @@
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
-  "id2label": {
-    "0": "LABEL_0",
-    "1": "LABEL_1",
-    "2": "LABEL_2",
-    "3": "LABEL_3",
-    "4": "LABEL_4",
-    "5": "LABEL_5",
-    "6": "LABEL_6",
-    "7": "LABEL_7",
-    "8": "LABEL_8",
-    "9": "LABEL_9",
-    "10": "LABEL_10",
-    "11": "LABEL_11",
-    "12": "LABEL_12"
-  },
   "initializer_range": 0.02,
   "intermediate_size": 3072,
-  "label2id": {
-    "LABEL_0": 0,
-    "LABEL_1": 1,
-    "LABEL_10": 10,
-    "LABEL_11": 11,
-    "LABEL_12": 12,
-    "LABEL_2": 2,
-    "LABEL_3": 3,
-    "LABEL_4": 4,
-    "LABEL_5": 5,
-    "LABEL_6": 6,
-    "LABEL_7": 7,
-    "LABEL_8": 8,
-    "LABEL_9": 9
-  },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
@@ -58,7 +28,7 @@
   "output_past": true,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
-  "problem_type": "multi_label_classification",
   "rnn": "lstm",
   "rnn_dropout": 0.0,
   "rnn_hidden": 768,

   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
   "output_past": true,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
   "rnn": "lstm",
   "rnn_dropout": 0.0,
   "rnn_hidden": 768,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ed0791527b896118ea31edbef3eaca2414f1703955c433c244ecd32b2d227392
-size 356827076

 version https://git-lfs.github.com/spec/v1
+oid sha256:a92472ced539c9ed12112d1438d0b130c44951287db768670582929089c67b45
+size 356793240

runs/Oct10_01-15-06_aura.fi.muni.cz/events.out.tfevents.1728515711.aura.fi.muni.cz.2703744.0 ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3ea952cdc52d3a22a3103edbc5db72bcab7feda8bc9bebff87dd00c6e0834e3
+size 6188

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:19be839c6b420bc29765950007a7d4d489872b31c62a0bccaea8cee5581aa46f
 size 4719

 version https://git-lfs.github.com/spec/v1
+oid sha256:5662e4985aecb11cdd9de961c61a71b4aa57d56799e2b3ddc56f4d9e79492415
 size 4719