AI-4-Health/HPP-FINETUNED-Meta-Llama-3-8B-Instruct

Browse files

Files changed (7) hide show

README.md +7 -28
adapter_config.json +1 -2
adapter_model.safetensors +2 -2
runs/Jun13_07-27-50_jupiter/events.out.tfevents.1718234875.jupiter.364556.1 +3 -0
runs/Jun13_07-29-42_jupiter/events.out.tfevents.1718234993.jupiter.364556.2 +3 -0
tokenizer.json +6 -1
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -18,7 +18,12 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 3.1279
 ## Model description
@@ -46,35 +51,9 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.05
-- num_epochs: 70
 - mixed_precision_training: Native AMP
-### Training results
-| Training Loss | Epoch   | Step | Validation Loss |
-|:-------------:|:-------:|:----:|:---------------:|
-| 1.3621        | 3.4964  | 420  | 1.4379          |
-| 1.1954        | 6.9927  | 840  | 1.4208          |
-| 0.8507        | 10.4891 | 1260 | 1.5712          |
-| 0.789         | 13.9854 | 1680 | 1.6759          |
-| 0.5388        | 17.4818 | 2100 | 1.9153          |
-| 0.4013        | 20.9781 | 2520 | 2.0319          |
-| 0.2933        | 24.4745 | 2940 | 2.2094          |
-| 0.207         | 27.9709 | 3360 | 2.3547          |
-| 0.1604        | 31.4672 | 3780 | 2.5483          |
-| 0.1154        | 34.9636 | 4200 | 2.5953          |
-| 0.0982        | 38.4599 | 4620 | 2.7355          |
-| 0.0954        | 41.9563 | 5040 | 2.8220          |
-| 0.0677        | 45.4527 | 5460 | 2.8909          |
-| 0.0613        | 48.9490 | 5880 | 2.9654          |
-| 0.0482        | 52.4454 | 6300 | 3.0125          |
-| 0.0415        | 55.9417 | 6720 | 3.0390          |
-| 0.0477        | 59.4381 | 7140 | 3.0992          |
-| 0.0412        | 62.9344 | 7560 | 3.1126          |
-| 0.0327        | 66.4308 | 7980 | 3.1262          |
-| 0.0391        | 69.9272 | 8400 | 3.1279          |
 ### Framework versions
 - PEFT 0.11.1

 This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- eval_loss: 1.4540
+- eval_runtime: 9.5935
+- eval_samples_per_second: 11.153
+- eval_steps_per_second: 1.459
+- epoch: 1.6649
+- step: 200
 ## Model description
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.05
+- num_epochs: 3
 - mixed_precision_training: Native AMP
 ### Framework versions
 - PEFT 0.11.1

adapter_config.json CHANGED Viewed

@@ -21,8 +21,7 @@
   "revision": null,
   "target_modules": [
     "v_proj",
-    "q_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "revision": null,
   "target_modules": [
     "v_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c8f5f623b5b1c86000a3a2a6f3b8bc4c7b09b9f4a1d783d2a0e5f90af49fffc9
-size 37774528

 version https://git-lfs.github.com/spec/v1
+oid sha256:6501ee19efb13db3066b3ca3111726396e9848de0f3f2bd951c6365b9f3ee49f
+size 27280152

runs/Jun13_07-27-50_jupiter/events.out.tfevents.1718234875.jupiter.364556.1 ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b5c4fc6d7a3ce71c069a3ea4524470b90fdcc0c4f582787bf75633a50d58dc54
+size 12172

runs/Jun13_07-29-42_jupiter/events.out.tfevents.1718234993.jupiter.364556.2 ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:760c8f0e24619da9f471817ad15bf2b10b8e3b6c88a98d022adc4537cafdcae9
+size 61567

tokenizer.json CHANGED Viewed

@@ -1,6 +1,11 @@
 {
   "version": "1.0",
-  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 512,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
   "padding": null,
   "added_tokens": [
     {

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4c6823eb48bb00e9a133c704981e76d9a75661b5b79220c69f8c03e99234f628
 size 4923

 version https://git-lfs.github.com/spec/v1
+oid sha256:02e896f485718fcc80ba95f42b802371c912c071b6c001915e5ead5020bf9fe6
 size 4923