llama2-stock-model

Browse files

Files changed (4) hide show

README.md +25 -26
adapter_config.json +7 -7
adapter_model.safetensors +2 -2
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -1,9 +1,8 @@
 ---
-license: apache-2.0
 library_name: peft
 tags:
 - generated_from_trainer
-base_model: mistralai/Mistral-7B-v0.1
 model-index:
 - name: mistral-stock-finetune
   results: []
@@ -14,9 +13,9 @@ should probably proofread and complete it, then remove this comment. -->
 # mistral-stock-finetune
-This model is a fine-tuned version of [mistralai/Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.6006
 ## Model description
@@ -48,32 +47,32 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 0.957         | 0.07  | 25   | 0.7369          |
-| 0.6947        | 0.13  | 50   | 0.6830          |
-| 0.68          | 0.2   | 75   | 0.6631          |
-| 0.6596        | 0.26  | 100  | 0.6512          |
-| 0.655         | 0.33  | 125  | 0.6424          |
-| 0.6355        | 0.4   | 150  | 0.6344          |
-| 0.6434        | 0.46  | 175  | 0.6297          |
-| 0.6307        | 0.53  | 200  | 0.6252          |
-| 0.6224        | 0.59  | 225  | 0.6215          |
-| 0.6128        | 0.66  | 250  | 0.6177          |
-| 0.6018        | 0.73  | 275  | 0.6148          |
-| 0.62          | 0.79  | 300  | 0.6118          |
-| 0.5959        | 0.86  | 325  | 0.6093          |
-| 0.6046        | 0.92  | 350  | 0.6062          |
-| 0.6062        | 0.99  | 375  | 0.6038          |
-| 0.5769        | 1.06  | 400  | 0.6053          |
-| 0.559         | 1.12  | 425  | 0.6027          |
-| 0.5599        | 1.19  | 450  | 0.6021          |
-| 0.5522        | 1.25  | 475  | 0.6010          |
-| 0.5547        | 1.32  | 500  | 0.6006          |
 ### Framework versions
-- PEFT 0.9.1.dev0
-- Transformers 4.39.0.dev0
 - Pytorch 2.1.0+cu118
 - Datasets 2.18.0
 - Tokenizers 0.15.2

 ---
 library_name: peft
 tags:
 - generated_from_trainer
+base_model: meta-llama/Llama-2-7b-hf
 model-index:
 - name: mistral-stock-finetune
   results: []
 # mistral-stock-finetune
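+This model is a fine-tuned version of [meta-llama/Llama-2-7b-hf](https://huggingface.co/meta-llama/Llama-2-7b-hf) on an unknown dataset. Note: the `mistral-stock-finetune` name is carried over from the earlier Mistral-7B-based version of this card; this adapter's base model is Llama 2.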
 It achieves the following results on the evaluation set:
+- Loss: 0.6325
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 1.2624        | 0.07  | 25   | 1.0074          |
+| 0.8582        | 0.13  | 50   | 0.7799          |
+| 0.7578        | 0.2   | 75   | 0.7358          |
+| 0.7276        | 0.26  | 100  | 0.7133          |
+| 0.7104        | 0.33  | 125  | 0.6944          |
+| 0.6791        | 0.4   | 150  | 0.6819          |
+| 0.6856        | 0.46  | 175  | 0.6734          |
+| 0.6723        | 0.53  | 200  | 0.6658          |
+| 0.6629        | 0.59  | 225  | 0.6601          |
+| 0.6526        | 0.66  | 250  | 0.6553          |
+| 0.6395        | 0.73  | 275  | 0.6505          |
+| 0.6537        | 0.79  | 300  | 0.6471          |
+| 0.6317        | 0.86  | 325  | 0.6445          |
+| 0.6401        | 0.92  | 350  | 0.6405          |
+| 0.6412        | 0.99  | 375  | 0.6375          |
+| 0.6303        | 1.06  | 400  | 0.6367          |
+| 0.6135        | 1.12  | 425  | 0.6347          |
+| 0.6107        | 1.19  | 450  | 0.6336          |
+| 0.605         | 1.25  | 475  | 0.6330          |
+| 0.6062        | 1.32  | 500  | 0.6325          |
 ### Framework versions
+- PEFT 0.10.1.dev0
+- Transformers 4.40.0.dev0
 - Pytorch 2.1.0+cu118
 - Datasets 2.18.0
 - Tokenizers 0.15.2

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "mistralai/Mistral-7B-v0.1",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -20,14 +20,14 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "down_proj",
-    "gate_proj",
-    "o_proj",
-    "lm_head",
     "v_proj",
     "k_proj",
-    "up_proj",
-    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "meta-llama/Llama-2-7b-hf",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
     "v_proj",
+    "lm_head",
     "k_proj",
+    "gate_proj",
+    "down_proj",
+    "o_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f260341af3c5a3501294d86b879fd6192a4d48ec0d5890f7c1fcda0552188efc
-size 864513616

 version https://git-lfs.github.com/spec/v1
+oid sha256:d02672009795a2cd99351b015eb1c026bdbd67ac8423f45150be12301ed7e2f4
+size 848784976

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0464207dc4a228aa156dd4e77277109ec5004f3b6b6769521b8ccb6ec50733bb
 size 4920

 version https://git-lfs.github.com/spec/v1
+oid sha256:2053d1b83f9224c5a19a46603617d2eed3093575944f8849a1d202cf2b94090b
 size 4920