GravityLLM / scripts /train_qlora.sh
lzanardos9's picture
Upload 20 files
b7720f0 verified
raw
history blame contribute delete
480 Bytes
#!/usr/bin/env bash
# Launches train.py with a fixed set of command-line flags for a QLoRA run.
# All paths below are relative, so they resolve against the caller's current
# working directory.

# Strict mode: exit on command failure, on use of an unset variable, and on a
# failure in any stage of a pipeline.
set -euo pipefail

# Flags handed to train.py, kept in an array so each flag/value pair sits on
# its own line without backslash continuations.
train_args=(
  # Base model, dataset files, and output directory.
  --model Qwen/Qwen2.5-1.5B-Instruct
  --train_file data/train.jsonl
  --valid_file data/valid.jsonl
  --output_dir outputs/GravityLLM-Qwen2.5-1.5B-S9

  # Sequence length and optimisation schedule.
  --max_length 2048
  --num_train_epochs 3
  --learning_rate 2e-4
  --train_batch_size 1
  --eval_batch_size 1
  --gradient_accumulation_steps 16
  --warmup_ratio 0.03

  # Logging, checkpoint, and evaluation intervals.
  --logging_steps 10
  --save_steps 100
  --eval_steps 100

  # Value-less switches.
  --qlora
  --bf16
)

python train.py "${train_args[@]}"