HuggingFaceUser/adapter-name

Files changed (5) hide show

README.md CHANGED Viewed

@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [microsoft/Phi-3.5-mini-instruct](https://huggingface.co/microsoft/Phi-3.5-mini-instruct) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.2347
 ## Model description
@@ -52,16 +52,16 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch  | Step | Validation Loss |
 |:-------------:|:------:|:----:|:---------------:|
-| 1.4504        | 0.2892 | 100  | 1.0898          |
-| 0.8583        | 0.5785 | 200  | 0.6481          |
-| 0.5379        | 0.8677 | 300  | 0.4534          |
-| 0.4042        | 1.1569 | 400  | 0.3593          |
-| 0.335         | 1.4461 | 500  | 0.3093          |
-| 0.2927        | 1.7354 | 600  | 0.2779          |
-| 0.2728        | 2.0246 | 700  | 0.2590          |
-| 0.251         | 2.3138 | 800  | 0.2468          |
-| 0.2374        | 2.6030 | 900  | 0.2388          |
-| 0.236         | 2.8923 | 1000 | 0.2347          |
 ### Framework versions

 This model is a fine-tuned version of [microsoft/Phi-3.5-mini-instruct](https://huggingface.co/microsoft/Phi-3.5-mini-instruct) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.2338
 ## Model description
 | Training Loss | Epoch  | Step | Validation Loss |
 |:-------------:|:------:|:----:|:---------------:|
+| 1.4504        | 0.2892 | 100  | 1.0894          |
+| 0.8508        | 0.5785 | 200  | 0.6406          |
+| 0.5328        | 0.8677 | 300  | 0.4493          |
+| 0.4011        | 1.1569 | 400  | 0.3575          |
+| 0.3328        | 1.4461 | 500  | 0.3085          |
+| 0.291         | 1.7354 | 600  | 0.2769          |
+| 0.2711        | 2.0246 | 700  | 0.2585          |
+| 0.2494        | 2.3138 | 800  | 0.2453          |
+| 0.2361        | 2.6030 | 900  | 0.2378          |
+| 0.2348        | 2.8923 | 1000 | 0.2338          |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -21,11 +21,11 @@
   "revision": null,
   "target_modules": [
     "q_proj",
     "o_proj",
     "up_proj",
-    "gate_proj",
     "v_proj",
-    "k_proj",
     "down_proj"
   ],
   "task_type": "CAUSAL_LM",

   "revision": null,
   "target_modules": [
     "q_proj",
+    "k_proj",
+    "gate_proj",
     "o_proj",
     "up_proj",
     "v_proj",
     "down_proj"
   ],
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aa8c3e396f9d65f516404e364ad3e7b5d8708ae8f79de5f1476f923cad8fffa8
 size 35668592

 version https://git-lfs.github.com/spec/v1
+oid sha256:79ba21bef598b7ff38e5b954d50b43531c9e568515c58d1fff239190482e54be
 size 35668592

tokenizer.json CHANGED Viewed

@@ -1,11 +1,6 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 512,
-    "strategy": "LongestFirst",
-    "stride": 0
-  },
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:32b70e00533bebcbf93f8152c4c9136a3d95126383957e08baee8354de5dcb14
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:61922441eeff57590b66cb2f5ced52a2642e7096ba9d81b02421ba0ee8a6020b
 size 5496