End of training

Browse files

Files changed (6) hide show

README.md +26 -26
adapter_config.json +1 -1
adapter_model.safetensors +1 -1
emissions.csv +1 -1
runs/Jul17_21-38-32_msc-modeltrain-pod/events.out.tfevents.1721252316.msc-modeltrain-pod.4064.0 +3 -0
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B](https://huggingface.co/meta-llama/Meta-Llama-3-8B) on the None dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.7284
 ## Model description
@@ -64,31 +64,31 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 3.7573        | 1.36  | 10   | 3.3722          |
-| 2.8144        | 2.71  | 20   | 2.0325          |
-| 1.5867        | 4.07  | 30   | 1.2586          |
-| 1.1875        | 5.42  | 40   | 1.0898          |
-| 1.0487        | 6.78  | 50   | 1.0168          |
-| 0.9716        | 8.14  | 60   | 0.9688          |
-| 0.9134        | 9.49  | 70   | 0.9304          |
-| 0.8505        | 10.85 | 80   | 0.8940          |
-| 0.7963        | 12.2  | 90   | 0.8640          |
-| 0.7497        | 13.56 | 100  | 0.8379          |
-| 0.7067        | 14.92 | 110  | 0.8080          |
-| 0.6484        | 16.27 | 120  | 0.7751          |
-| 0.5945        | 17.63 | 130  | 0.7385          |
-| 0.5349        | 18.98 | 140  | 0.6990          |
-| 0.4854        | 20.34 | 150  | 0.6956          |
-| 0.4729        | 21.69 | 160  | 0.6990          |
-| 0.4496        | 23.05 | 170  | 0.6885          |
-| 0.4405        | 24.41 | 180  | 0.7089          |
-| 0.435         | 25.76 | 190  | 0.7215          |
-| 0.4243        | 27.12 | 200  | 0.7162          |
-| 0.418         | 28.47 | 210  | 0.7205          |
-| 0.4156        | 29.83 | 220  | 0.7296          |
-| 0.4153        | 31.19 | 230  | 0.7275          |
-| 0.4146        | 32.54 | 240  | 0.7292          |
-| 0.4094        | 33.9  | 250  | 0.7284          |
 ### Framework versions

 This model is a fine-tuned version of [meta-llama/Meta-Llama-3-8B](https://huggingface.co/meta-llama/Meta-Llama-3-8B) on the None dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.7698
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 3.7636        | 1.36  | 10   | 3.3566          |
+| 2.8254        | 2.71  | 20   | 2.0280          |
+| 1.5642        | 4.07  | 30   | 1.2681          |
+| 1.1877        | 5.42  | 40   | 1.1017          |
+| 1.0503        | 6.78  | 50   | 1.0240          |
+| 0.9732        | 8.14  | 60   | 0.9786          |
+| 0.9065        | 9.49  | 70   | 0.9394          |
+| 0.8513        | 10.85 | 80   | 0.9004          |
+| 0.7914        | 12.2  | 90   | 0.8791          |
+| 0.7408        | 13.56 | 100  | 0.8509          |
+| 0.6882        | 14.92 | 110  | 0.8191          |
+| 0.6389        | 16.27 | 120  | 0.7877          |
+| 0.5855        | 17.63 | 130  | 0.7748          |
+| 0.5293        | 18.98 | 140  | 0.7502          |
+| 0.4876        | 20.34 | 150  | 0.7337          |
+| 0.4619        | 21.69 | 160  | 0.7275          |
+| 0.4458        | 23.05 | 170  | 0.7315          |
+| 0.4287        | 24.41 | 180  | 0.7475          |
+| 0.434         | 25.76 | 190  | 0.7489          |
+| 0.4186        | 27.12 | 200  | 0.7573          |
+| 0.4158        | 28.47 | 210  | 0.7618          |
+| 0.4105        | 29.83 | 220  | 0.7719          |
+| 0.4039        | 31.19 | 230  | 0.7677          |
+| 0.4087        | 32.54 | 240  | 0.7692          |
+| 0.4078        | 33.9  | 250  | 0.7698          |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -8,7 +8,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "lora_alpha": 64,
-  "lora_dropout": 0.2,
   "modules_to_save": null,
   "peft_type": "LORA",
   "r": 32,

   "layers_pattern": null,
   "layers_to_transform": null,
   "lora_alpha": 64,
+  "lora_dropout": 0.3,
   "modules_to_save": null,
   "peft_type": "LORA",
   "r": 32,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dcd4cce18bd06fc14145a73cf25cd3cab8a326057bc4fba56c7d5e68c2670d70
 size 75523312

 version https://git-lfs.github.com/spec/v1
+oid sha256:2396fd1095bb4c7827c0b91569b26ee5a0da7c1bc67d4316e1ed3125d0412e8c
 size 75523312

emissions.csv CHANGED Viewed

	@@ -1,2 +1,2 @@
1	timestamp,experiment_id,project_name,duration,emissions,energy_consumed,country_name,country_iso_code,region,on_cloud,cloud_provider,cloud_region
2	- 2024-07-17T21:26:16,875bb1fb-55b3-4654-806d-76f2ddaca959,codecarbon,1335.8051824569702,0.07996877307198384,0.1189818413677245,United Kingdom,GBR,scotland,N,,


1	timestamp,experiment_id,project_name,duration,emissions,energy_consumed,country_name,country_iso_code,region,on_cloud,cloud_provider,cloud_region
2	+ 2024-07-17T22:00:54,d57424a2-3051-45e7-aa21-4122e466d370,codecarbon,1337.6511194705963,0.0797943164549178,0.11872227543042274,United Kingdom,GBR,scotland,N,,

runs/Jul17_21-38-32_msc-modeltrain-pod/events.out.tfevents.1721252316.msc-modeltrain-pod.4064.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a499cb40b2ffb68fb419ee2947907e88110548e71bc461625835eda838a3b37a
+size 17467

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1f116e75b2c681e3d8ef6631a40874a06edfdccef281260daae484fdda3bebfd
 size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:7c5748d207260224e60fd82bd6da0e65c6d55013cba7f3cac16494bfcf932da6
 size 4984