Training in progress, step 200

Files changed (7) hide show

adapter_config.json CHANGED Viewed

@@ -9,13 +9,13 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 16,
   "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 8,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [

   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
+  "lora_alpha": 32,
   "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:219ec5f4314d4b3a5aecfdaffc318888edf58a347fd1f4d32025dabf899ee152
-size 8405600

 version https://git-lfs.github.com/spec/v1
+oid sha256:c38c2abdfca3b929c12ab474d22007c5a8dbc1e39d0928966714fdc36feeadfd
+size 16794456

angle.config CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "model_name_or_path": "NousResearch/Llama-2-7b-hf",
-  "max_length": 85,
   "model_kwargs": {},
   "pooling_strategy": "cls",
   "lora_config_kwargs": {
     "task_type": "CAUSAL_LM",
-    "r": 8,
-    "lora_alpha": 16,
     "lora_dropout": 0.05,
     "bias": "none"
   },

 {
   "model_name_or_path": "NousResearch/Llama-2-7b-hf",
+  "max_length": 80,
   "model_kwargs": {},
   "pooling_strategy": "cls",
   "lora_config_kwargs": {
     "task_type": "CAUSAL_LM",
+    "r": 16,
+    "lora_alpha": 32,
     "lora_dropout": 0.05,
     "bias": "none"
   },

runs/Apr07_09-45-24_instance-20240226-074643/events.out.tfevents.1712483135.instance-20240226-074643.1028754.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c570271218c3ae829306367fa885f08352af334ed3fcd519601e892638d1ba6a
-size 14954

 version https://git-lfs.github.com/spec/v1
+oid sha256:e42a2d055594d758a3e5fc29a06091c71406f518af7f6859aeb1b852bc35b2f4
+size 15308

runs/Apr07_10-49-45_instance-20240226-074643/events.out.tfevents.1712487001.instance-20240226-074643.1056587.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:cbafd3541014df5974b521b3a0a4db8dcdcb172c176decc0ce5ec744668e9620
+size 5459

runs/Apr07_10-54-47_instance-20240226-074643/events.out.tfevents.1712487297.instance-20240226-074643.1068449.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:593ffb26a222b94912356903b05541a021da32f74a2a3a43c45b4ab39262d899
+size 5248

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6db33d706f52b48b673761422b942d830dcc688166c0018b7e5be347b77c25d6
 size 5048

 version https://git-lfs.github.com/spec/v1
+oid sha256:fdf217563738fa69d3a9c66dcdbd1f1b153e692ca31ae94436a1183ca3c5553f
 size 5048