Surya1523
/

healthbot

text-generation-inference

Model card Files Files and versions

Surya1523 committed on Apr 16

Commit

8069f55

·

verified ·

1 Parent(s): 1cdb179

Create config.json

Files changed (1) hide show

config.json +47 -0

config.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "model_name": "unsloth/Phi-3-mini-4k-instruct",
+  "model_type": "phi-3",
+  "max_seq_length": 2048,
+  "load_in_4bit": true,
+  "lora_config": {
+    "r": 16,
+    "lora_alpha": 16,
+    "target_modules": [
+      "q_proj",
+      "k_proj",
+      "v_proj",
+      "o_proj",
+      "gate_proj",
+      "up_proj",
+      "down_proj"
+    ],
+    "lora_dropout": 0,
+    "bias": "none",
+    "use_gradient_checkpointing": "unsloth",
+    "random_state": 3407,
+    "use_rslora": false,
+    "loftq_config": null
+  },
+  "training_arguments": {
+    "per_device_train_batch_size": 2,
+    "gradient_accumulation_steps": 4,
+    "warmup_steps": 5,
+    "max_steps": 60,
+    "learning_rate": 2e-4,
+    "fp16": true,
+    "bf16": false,
+    "logging_steps": 1,
+    "optim": "adamw_8bit",
+    "weight_decay": 0.01,
+    "lr_scheduler_type": "linear",
+    "seed": 3407,
+    "output_dir": "outputs"
+  },
+  "data_config": {
+    "dataset_text_field": "text",
+    "max_seq_length": 2048,
+    "dataset_num_proc": 2,
+    "packing": false
+  }
+}