burtenshaw
/

Qwen1.5-0.5B-dpo-mix-7k-3000

Text Generation

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

Qwen1.5-0.5B-dpo-mix-7k-3000 / runpod.sh

burtenshaw's picture

burtenshaw HF staff

Upload folder using huggingface_hub

4ad32d0 verified 8 months ago

859 Bytes

	# Install dependencies, fetch the orpo training code, run a single-process
	# training job through `accelerate launch`, then upload the resulting run
	# directory to the Hugging Face Hub.
	#
	# Required environment variables:
	#   WANDB_TOKEN    - passed to `wandb login`
	#   WANDB_PROJECT  - passed to `wandb init -p`
	#   LEARNING_RATE  - passed to main.py as --lr
	#   MODEL_ID       - passed to main.py as --model_name
	#   DATASET        - passed to main.py as --data_name
	#   EPOCH          - passed to main.py as --num_train_epochs
	#   MAX_SAMPLES    - passed to main.py as --max_samples
	#   OUTPUT         - directory entered after training (a relative path is
	#                    resolved from inside the orpo checkout)
	#   TOKEN          - passed to `huggingface-cli login --token`
	#   NEW_MODEL      - repository id passed to `huggingface-cli upload`

	# Stop at the first failing command or unset variable so that a broken
	# install or training run can never fall through to the upload step.
	set -eu

	# Validate the configuration before doing any slow or irreversible work.
	: "${WANDB_TOKEN:?WANDB_TOKEN must be set}"
	: "${WANDB_PROJECT:?WANDB_PROJECT must be set}"
	: "${LEARNING_RATE:?LEARNING_RATE must be set}"
	: "${MODEL_ID:?MODEL_ID must be set}"
	: "${DATASET:?DATASET must be set}"
	: "${EPOCH:?EPOCH must be set}"
	: "${MAX_SAMPLES:?MAX_SAMPLES must be set}"
	: "${OUTPUT:?OUTPUT must be set}"
	: "${TOKEN:?TOKEN must be set}"
	: "${NEW_MODEL:?NEW_MODEL must be set}"

	pip install datasets accelerate wandb transformers bitsandbytes sentencepiece

	# Reuse an existing checkout so the script can be re-run in the same place.
	if [ ! -d orpo ]; then
		git clone https://github.com/burtenshaw/orpo.git
	fi
	cd orpo

	# Force a single process: rewrite num_processes in the accelerate config
	# and the --num_proc default in args.py.
	sed -i 's/num_processes: 2/num_processes: 1/' ./src/accelerate/fsdp.yaml
	sed -i 's/--num_proc", default=8/--num_proc", default=1/' ./src/args.py

	wandb login "$WANDB_TOKEN"
	wandb init -p "$WANDB_PROJECT"

	accelerate launch --config_file ./src/accelerate/fsdp.yaml main.py \
		--lr "$LEARNING_RATE" \
		--warmup_steps 100 \
		--model_name "$MODEL_ID" \
		--data_name "$DATASET" \
		--num_train_epochs "$EPOCH" \
		--max_samples "$MAX_SAMPLES" \
		--prompt_max_length 128 \
		--response_max_length 2048 \
		--per_device_train_batch_size 4 \
		--per_device_eval_batch_size 4 \
		--gradient_accumulation_steps 1 \
		--num_proc 1

	cd -- "$OUTPUT"

	# Enter the single subdirectory of $OUTPUT.
	# NOTE(review): presumably main.py writes one run directory here - confirm.
	# A bare `cd */` hands several arguments to cd when more than one
	# subdirectory exists, so require exactly one match instead.
	set -- */
	if [ "$#" -ne 1 ] || [ ! -d "$1" ]; then
		printf 'expected exactly one subdirectory in %s, found: %s\n' "$OUTPUT" "$*" >&2
		exit 1
	fi
	cd -- "$1"

	huggingface-cli login --token "$TOKEN"
	# Upload the current directory to the root of the target repository.
	huggingface-cli upload "$NEW_MODEL" . .