Commit ac90237 (verified) by ncbateman
Parent(s): 773e340

Training in progress, step 5
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "unsloth/Llama-3.2-3B-Instruct",
+  "base_model_name_or_path": "unsloth/Llama-3.2-1B-Instruct",
   "bias": "none",
   "fan_in_fan_out": null,
   "inference_mode": true,
@@ -20,12 +20,12 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "up_proj",
-    "v_proj",
-    "down_proj",
+    "o_proj",
     "gate_proj",
     "k_proj",
-    "o_proj",
+    "v_proj",
+    "down_proj",
+    "up_proj",
     "q_proj"
   ],
   "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c29fe5021e49dba24dd43762b3dadd35d838259e1b435723f03cd3ed35484811
-size 97307544
+oid sha256:36d803e3004ea212261d2296d570b2613622bb2d57d19247a0794a0d3a9a27e6
+size 45118424
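
This is a Git LFS pointer rather than the weights themselves: the oid is the SHA-256 of the real file and size is its byte count, so the adapter shrank from roughly 97 MB to roughly 45 MB with the move to the 1B base. A sketch of verifying a downloaded copy against the new pointer (the local path is hypothetical):

# A sketch; "adapter_model.safetensors" is a hypothetical local path.
import hashlib

EXPECTED_OID = "36d803e3004ea212261d2296d570b2613622bb2d57d19247a0794a0d3a9a27e6"
EXPECTED_SIZE = 45118424

with open("adapter_model.safetensors", "rb") as f:
    data = f.read()

assert len(data) == EXPECTED_SIZE, "size mismatch"
assert hashlib.sha256(data).hexdigest() == EXPECTED_OID, "hash mismatch"
print("file matches the LFS pointer")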
config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "unsloth/Llama-3.2-3B-Instruct",
+  "_name_or_path": "unsloth/Llama-3.2-1B-Instruct",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -7,16 +7,16 @@
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
   "eos_token_id": 128009,
-  "head_dim": 128,
+  "head_dim": 64,
   "hidden_act": "silu",
-  "hidden_size": 3072,
+  "hidden_size": 2048,
   "initializer_range": 0.02,
   "intermediate_size": 8192,
   "max_position_embeddings": 131072,
   "mlp_bias": false,
   "model_type": "llama",
-  "num_attention_heads": 24,
-  "num_hidden_layers": 28,
+  "num_attention_heads": 32,
+  "num_hidden_layers": 16,
   "num_key_value_heads": 8,
   "pretraining_tp": 1,
   "quantization_config": {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:149bf676ee240872bdd921fd399e5f04e9da82fac8085640882d9238e1b62f8e
+oid sha256:9cd577c5ab87da13d015cd24a6e120ff8a2e22b22b888aace5c91b290baf1e7d
 size 6648