Training in progress, step 100

Files changed (6) hide show

adapter_config.json CHANGED Viewed

@@ -19,12 +19,12 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
     "k_proj",
-    "up_proj",
     "v_proj",
     "o_proj",
-    "down_proj",
     "gate_proj"
   ],
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "down_proj",
     "k_proj",
     "v_proj",
     "o_proj",
+    "up_proj",
+    "q_proj",
     "gate_proj"
   ],
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b605b4dec6f41fef22a7f56fcf6dc58ae13c4cef1f7dc1041108e6713b99357
 size 639691872

 version https://git-lfs.github.com/spec/v1
+oid sha256:74a7a13cdfda33d6dc51f1de17c77c4219c3c95b0690e7f0f54b1e7e88597d47
 size 639691872

angle.config CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "model_name_or_path": "NousResearch/Llama-2-7b-hf",
-  "max_length": 85,
   "model_kwargs": {},
   "pooling_strategy": "cls",
   "lora_config_kwargs": {
@@ -11,12 +11,12 @@
     "bias": "none",
     "target_modules": [
       "q_proj",
-      "k_proj",
       "up_proj",
       "v_proj",
-      "o_proj",
-      "down_proj",
-      "gate_proj"
     ]
   },
   "apply_lora": 1

 {
   "model_name_or_path": "NousResearch/Llama-2-7b-hf",
+  "max_length": 75,
   "model_kwargs": {},
   "pooling_strategy": "cls",
   "lora_config_kwargs": {
     "bias": "none",
     "target_modules": [
       "q_proj",
+      "o_proj",
       "up_proj",
       "v_proj",
+      "gate_proj",
+      "k_proj",
+      "down_proj"
     ]
   },
   "apply_lora": 1

runs/Mar21_01-43-18_instance-20240226-074643/events.out.tfevents.1710985403.instance-20240226-074643.2250503.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aeb3144f81c5f6fba72dcbb81588c8bbc2394e5bdd59eff2ae88a4a6ad25016c
-size 14275

 version https://git-lfs.github.com/spec/v1
+oid sha256:6078f886b6854166aca865f86b5d4e8ab5d936b1401f3678584e892436ee3462
+size 14840

runs/Mar22_13-13-14_instance-20240226-074643/events.out.tfevents.1711113203.instance-20240226-074643.3260260.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:afa993ea1d223a53dba00ab4673039a7ec430096605fe93abc8fb0b6295cc9f2
+size 5413

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dc11b5306294f493aeddcb98df863a108e665e74ac0e48b5ef03627c24e7875b
 size 5048

 version https://git-lfs.github.com/spec/v1
+oid sha256:8683f1534b803565058f488cf02c4891f4edbcb2b2895ce55448900b3cb5d972
 size 5048