lykeven
/

uptest

Inference Endpoints

Model card Files Files and versions Metrics Training metrics Community

uptest / ptuning / train_chat.sh

lykeven's picture

first model commit

54abf22 over 1 year ago

743 Bytes

	# Launch a training run of main.py against THUDM/chatglm-6b using chat-style
	# data (prompt / response / history columns).
	#
	# Required environment variables (this script does not set them):
	#   CHAT_TRAIN_DATA  - passed to --train_file
	#   CHAT_VAL_DATA    - passed to --validation_file
	#   CHECKPOINT_NAME  - passed to --output_dir; note --overwrite_output_dir
	#                      is also passed
	#
	# NOTE(review): the exact meaning of each flag is defined by main.py, which
	# is not visible here; confirm against main.py before changing values.

	# Fail fast with a clear message. Unquoted and unset, these would expand to
	# nothing and the flag in front of them would silently lose its value.
	: "${CHAT_TRAIN_DATA:?CHAT_TRAIN_DATA must be set (value for --train_file)}"
	: "${CHAT_VAL_DATA:?CHAT_VAL_DATA must be set (value for --validation_file)}"
	: "${CHECKPOINT_NAME:?CHECKPOINT_NAME must be set (value for --output_dir)}"

	# Hyperparameters forwarded to --pre_seq_len and --learning_rate below.
	PRE_SEQ_LEN=8
	LR=1e-2

	# CUDA_VISIBLE_DEVICES=0 exposes only GPU 0 to the python process.
	# All expansions are quoted so paths containing spaces or glob characters
	# reach main.py as a single argument each.
	CUDA_VISIBLE_DEVICES=0 python3 main.py \
	--do_train \
	--train_file "$CHAT_TRAIN_DATA" \
	--validation_file "$CHAT_VAL_DATA" \
	--prompt_column prompt \
	--response_column response \
	--history_column history \
	--overwrite_cache \
	--model_name_or_path THUDM/chatglm-6b \
	--output_dir "$CHECKPOINT_NAME" \
	--overwrite_output_dir \
	--max_source_length 256 \
	--max_target_length 256 \
	--per_device_train_batch_size 1 \
	--per_device_eval_batch_size 1 \
	--gradient_accumulation_steps 16 \
	--predict_with_generate \
	--max_steps 3000 \
	--logging_steps 10 \
	--save_steps 1000 \
	--learning_rate "$LR" \
	--pre_seq_len "$PRE_SEQ_LEN" \
	--quantization_bit 4