mistral-lp2-org_org_a

Browse files

Files changed (3) hide show

README.md +20 -20
adapter_config.json +2 -2
adapter_model.safetensors +2 -2

README.md CHANGED Viewed

@@ -16,10 +16,10 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on an unspecified dataset (no dataset name was recorded when this card was generated).
 It achieves the following results on the evaluation set:
-- Loss: 0.9110
-- F1 Micro: 0.8214
-- F1 Macro: 0.8156
-- F1 Weighted: 0.8234
 ## Model description
@@ -50,22 +50,22 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch  | Step | Validation Loss | F1 Micro | F1 Macro | F1 Weighted |
 |:-------------:|:------:|:----:|:---------------:|:--------:|:--------:|:-----------:|
-| 1.979         | 0.0154 | 25   | 1.4043          | 0.7220   | 0.7197   | 0.7259      |
-| 1.3006        | 0.0308 | 50   | 1.2184          | 0.7775   | 0.7754   | 0.7807      |
-| 1.1099        | 0.0462 | 75   | 1.1320          | 0.8010   | 0.7970   | 0.8040      |
-| 1.1383        | 0.0615 | 100  | 1.0762          | 0.8039   | 0.8007   | 0.8072      |
-| 1.0121        | 0.0769 | 125  | 1.0230          | 0.8010   | 0.7967   | 0.8037      |
-| 1.0296        | 0.0923 | 150  | 0.9966          | 0.8099   | 0.8056   | 0.8130      |
-| 1.0485        | 0.1077 | 175  | 0.9745          | 0.8111   | 0.8063   | 0.8139      |
-| 0.9996        | 0.1231 | 200  | 0.9647          | 0.8030   | 0.7984   | 0.8052      |
-| 0.9815        | 0.1385 | 225  | 0.9490          | 0.8160   | 0.8099   | 0.8178      |
-| 0.9456        | 0.1538 | 250  | 0.9378          | 0.8073   | 0.8033   | 0.8099      |
-| 0.8896        | 0.1692 | 275  | 0.9298          | 0.8143   | 0.8091   | 0.8164      |
-| 0.994         | 0.1846 | 300  | 0.9239          | 0.8064   | 0.8030   | 0.8094      |
-| 0.8588        | 0.2    | 325  | 0.9142          | 0.8119   | 0.8079   | 0.8145      |
-| 0.8971        | 0.2154 | 350  | 0.9139          | 0.8216   | 0.8158   | 0.8236      |
-| 0.9647        | 0.2308 | 375  | 0.9133          | 0.8223   | 0.8163   | 0.8242      |
-| 0.9352        | 0.2462 | 400  | 0.9110          | 0.8214   | 0.8156   | 0.8234      |
 ### Framework versions

 This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on an unspecified dataset (no dataset name was recorded when this card was generated).
 It achieves the following results on the evaluation set:
+- Loss: 0.8643
+- F1 Micro: 0.6606
+- F1 Macro: 0.6479
+- F1 Weighted: 0.6611
 ## Model description
 | Training Loss | Epoch  | Step | Validation Loss | F1 Micro | F1 Macro | F1 Weighted |
 |:-------------:|:------:|:----:|:---------------:|:--------:|:--------:|:-----------:|
+| 1.6117        | 0.0154 | 25   | 1.3679          | 0.5541   | 0.4980   | 0.5313      |
+| 1.2903        | 0.0308 | 50   | 1.2094          | 0.6156   | 0.5779   | 0.6029      |
+| 1.164         | 0.0462 | 75   | 1.0987          | 0.6206   | 0.5931   | 0.6141      |
+| 1.1168        | 0.0615 | 100  | 1.1057          | 0.6376   | 0.5883   | 0.6165      |
+| 1.026         | 0.0769 | 125  | 0.9896          | 0.6314   | 0.6196   | 0.6328      |
+| 0.9481        | 0.0923 | 150  | 0.9619          | 0.6438   | 0.6173   | 0.6373      |
+| 0.9797        | 0.1077 | 175  | 0.9549          | 0.6514   | 0.6191   | 0.6411      |
+| 1.045         | 0.1231 | 200  | 0.9121          | 0.6541   | 0.6403   | 0.6543      |
+| 0.8954        | 0.1385 | 225  | 0.8991          | 0.6595   | 0.6418   | 0.6576      |
+| 0.9245        | 0.1538 | 250  | 0.8887          | 0.6588   | 0.6433   | 0.6580      |
+| 0.8636        | 0.1692 | 275  | 0.8824          | 0.6602   | 0.6458   | 0.6600      |
+| 0.846         | 0.1846 | 300  | 0.8793          | 0.6672   | 0.6451   | 0.6627      |
+| 0.8885        | 0.2    | 325  | 0.8820          | 0.6696   | 0.6431   | 0.6624      |
+| 0.8323        | 0.2154 | 350  | 0.8652          | 0.6618   | 0.6474   | 0.6616      |
+| 0.9313        | 0.2308 | 375  | 0.8654          | 0.6601   | 0.6477   | 0.6608      |
+| 0.857         | 0.2462 | 400  | 0.8643          | 0.6606   | 0.6479   | 0.6611      |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -20,9 +20,9 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "k_proj",
-    "q_proj",
     "v_proj",
     "o_proj"
   ],
   "task_type": "SEQ_CLS",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
+    "q_proj",
+    "k_proj",
     "o_proj"
   ],
   "task_type": "SEQ_CLS",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d287f3e911660a53e7f747ea43f5714abadb39a0ac9ea29328dfffd8e531d587
-size 578898352

 version https://git-lfs.github.com/spec/v1
+oid sha256:0789a908ecfc7cdc60018ed5a135a610ddf9a4edd3e2dc3aebcfb909c83c39fe
+size 578881968