eskayML/bert_interview_new

Files changed (5) hide show

README.md CHANGED Viewed

@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unspecified dataset (no dataset name was recorded in the training metadata).
 It achieves the following results on the evaluation set:
-- Loss: 1.4570
-- Accuracy: 0.8611
 ## Model description
@@ -50,21 +50,21 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
-| No log        | 1.0   | 54   | 2.2496          | 0.2593   |
-| No log        | 2.0   | 108  | 2.1561          | 0.4444   |
-| No log        | 3.0   | 162  | 2.0315          | 0.5648   |
-| No log        | 4.0   | 216  | 1.9100          | 0.6852   |
-| No log        | 5.0   | 270  | 1.7820          | 0.7870   |
-| No log        | 6.0   | 324  | 1.6627          | 0.8056   |
-| No log        | 7.0   | 378  | 1.5728          | 0.8519   |
-| No log        | 8.0   | 432  | 1.5169          | 0.8611   |
-| No log        | 9.0   | 486  | 1.4705          | 0.8611   |
-| 1.9122        | 10.0  | 540  | 1.4570          | 0.8611   |
 ### Framework versions
-- Transformers 4.46.2
 - Pytorch 2.5.1+cu121
-- Datasets 3.1.0
-- Tokenizers 0.20.3

 This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unspecified dataset (no dataset name was recorded in the training metadata).
 It achieves the following results on the evaluation set:
+- Loss: 0.7181
+- Accuracy: 0.8362
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:--------:|
+| 2.5731        | 1.0   | 579  | 2.3539          | 0.2888   |
+| 2.2431        | 2.0   | 1158 | 1.8700          | 0.4526   |
+| 1.8916        | 3.0   | 1737 | 1.5977          | 0.5302   |
+| 1.5897        | 4.0   | 2316 | 1.2684          | 0.6509   |
+| 1.485         | 5.0   | 2895 | 1.0863          | 0.6724   |
+| 1.282         | 6.0   | 3474 | 0.9135          | 0.7716   |
+| 1.0021        | 7.0   | 4053 | 0.8167          | 0.8103   |
+| 0.9446        | 8.0   | 4632 | 0.7997          | 0.8017   |
+| 0.8573        | 9.0   | 5211 | 0.7286          | 0.8319   |
+| 0.8327        | 10.0  | 5790 | 0.7181          | 0.8362   |
 ### Framework versions
+- Transformers 4.47.1
 - Pytorch 2.5.1+cu121
+- Datasets 3.2.0
+- Tokenizers 0.21.0

config.json CHANGED Viewed

@@ -9,29 +9,49 @@
   "dropout": 0.1,
   "hidden_dim": 3072,
   "id2label": {
-    "0": "Provider Characteristics",
-    "1": "Finanicial Impact",
-    "2": "Imaging modalities in general",
-    "3": "Clinical utility & efficiency-Provider perspective",
-    "4": "Health System Characteristics",
-    "5": "Training",
-    "6": "Value equation",
-    "7": "Workflow related problems",
-    "8": "Credentialing / Quality Assurance Infrastructure",
-    "9": "Patient/Physican interaction in LUS"
   },
   "initializer_range": 0.02,
   "label2id": {
-    "Clinical utility & efficiency-Provider perspective": 3,
-    "Credentialing / Quality Assurance Infrastructure": 8,
-    "Finanicial Impact": 1,
-    "Health System Characteristics": 4,
-    "Imaging modalities in general": 2,
-    "Patient/Physican interaction in LUS": 9,
-    "Provider Characteristics": 0,
-    "Training": 5,
-    "Value equation": 6,
-    "Workflow related problems": 7
   },
   "max_position_embeddings": 512,
   "model_type": "distilbert",
@@ -44,6 +64,6 @@
   "sinusoidal_pos_embds": false,
   "tie_weights_": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.46.2",
   "vocab_size": 30522
 }

   "dropout": 0.1,
   "hidden_dim": 3072,
   "id2label": {
+    "0": 0,
+    "1": 1,
+    "2": 2,
+    "3": 3,
+    "4": 4,
+    "5": 5,
+    "6": 6,
+    "7": 7,
+    "8": 8,
+    "9": 9,
+    "10": 10,
+    "11": 11,
+    "12": 12,
+    "13": 13,
+    "14": 14,
+    "15": 15,
+    "16": 16,
+    "17": 17,
+    "18": 18,
+    "19": 19
   },
   "initializer_range": 0.02,
   "label2id": {
+    "0": 0,
+    "1": 1,
+    "2": 2,
+    "3": 3,
+    "4": 4,
+    "5": 5,
+    "6": 6,
+    "7": 7,
+    "8": 8,
+    "9": 9,
+    "10": 10,
+    "11": 11,
+    "12": 12,
+    "13": 13,
+    "14": 14,
+    "15": 15,
+    "16": 16,
+    "17": 17,
+    "18": 18,
+    "19": 19
   },
   "max_position_embeddings": 512,
   "model_type": "distilbert",
   "sinusoidal_pos_embds": false,
   "tie_weights_": true,
   "torch_dtype": "float32",
+  "transformers_version": "4.47.1",
   "vocab_size": 30522
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5781acb0a050967ce595023e4e53272afd7e4938875b97822b967b8a91830c7e
-size 267857176

 version https://git-lfs.github.com/spec/v1
+oid sha256:787125a1a263020e64363a71de35d5f07c6ea241495191b65f21ebed48f5094c
+size 267887936

tokenizer_config.json CHANGED Viewed

@@ -44,6 +44,7 @@
   "clean_up_tokenization_spaces": false,
   "cls_token": "[CLS]",
   "do_lower_case": true,
   "mask_token": "[MASK]",
   "max_length": 512,
   "model_max_length": 512,

   "clean_up_tokenization_spaces": false,
   "cls_token": "[CLS]",
   "do_lower_case": true,
+  "extra_special_tokens": {},
   "mask_token": "[MASK]",
   "max_length": 512,
   "model_max_length": 512,

training_args.bin CHANGED Viewed

Binary files a/training_args.bin and b/training_args.bin differ