q1e123
/

peft-starcoder-lora-a100

q1e123 committed on May 21, 2024

Commit

6f61019

verified ·

1 Parent(s): f85870f

Model save

Files changed (3) hide show

README.md CHANGED Viewed

@@ -3,7 +3,7 @@ license: apache-2.0
 library_name: peft
 tags:
 - generated_from_trainer
-base_model: distilgpt2
 model-index:
 - name: peft-starcoder-lora-a100
   results: []
@@ -14,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
 # peft-starcoder-lora-a100
-This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
 ## Model description

 library_name: peft
 tags:
 - generated_from_trainer
+base_model: distilbert/distilgpt2
 model-index:
 - name: peft-starcoder-lora-a100
   results: []
 # peft-starcoder-lora-a100
+This model is a fine-tuned version of [distilbert/distilgpt2](https://huggingface.co/distilbert/distilgpt2) on an unknown dataset.
 ## Model description

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "distilgpt2",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -20,30 +20,30 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "transformer.h.3.attn.c_proj",
-    "transformer.h.3.mlp.c_fc",
-    "transformer.h.5.mlp.c_fc",
-    "transformer.h.4.mlp.c_fc",
-    "transformer.h.2.mlp.c_proj",
-    "transformer.h.0.mlp.c_proj",
-    "transformer.h.4.attn.c_proj",
-    "transformer.h.3.mlp.c_proj",
     "transformer.h.4.attn.c_attn",
-    "transformer.h.4.mlp.c_proj",
-    "transformer.h.3.attn.c_attn",
     "transformer.h.1.attn.c_attn",
-    "transformer.h.0.attn.c_attn",
-    "transformer.h.1.attn.c_proj",
     "transformer.h.1.mlp.c_proj",
-    "transformer.h.5.mlp.c_proj",
     "transformer.h.2.attn.c_proj",
-    "transformer.h.5.attn.c_attn",
     "transformer.h.0.mlp.c_fc",
-    "transformer.h.0.attn.c_proj",
-    "transformer.h.2.mlp.c_fc",
     "transformer.h.2.attn.c_attn",
-    "transformer.h.5.attn.c_proj",
-    "transformer.h.1.mlp.c_fc"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "distilbert/distilgpt2",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "transformer.h.4.attn.c_attn",
+    "transformer.h.5.attn.c_attn",
+    "transformer.h.4.attn.c_proj",
     "transformer.h.1.attn.c_attn",
+    "transformer.h.2.mlp.c_proj",
     "transformer.h.1.mlp.c_proj",
+    "transformer.h.4.mlp.c_proj",
+    "transformer.h.3.attn.c_proj",
+    "transformer.h.4.mlp.c_fc",
+    "transformer.h.5.attn.c_proj",
+    "transformer.h.0.attn.c_proj",
+    "transformer.h.3.attn.c_attn",
     "transformer.h.2.attn.c_proj",
     "transformer.h.0.mlp.c_fc",
     "transformer.h.2.attn.c_attn",
+    "transformer.h.0.mlp.c_proj",
+    "transformer.h.1.attn.c_proj",
+    "transformer.h.5.mlp.c_fc",
+    "transformer.h.3.mlp.c_fc",
+    "transformer.h.1.mlp.c_fc",
+    "transformer.h.3.mlp.c_proj",
+    "transformer.h.0.attn.c_attn",
+    "transformer.h.5.mlp.c_proj",
+    "transformer.h.2.mlp.c_fc"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:905022d7425bfab0d74e1dc861298969f9c63ef170520ac60873a866360e5cff
 size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:1e5f0f0ada0564f9402e4b8399d0f7dce549cebc056ce5b9a9b91edac79b2585
 size 5112