sparse / ms-swift /tests /infer /test_agent.py
Enxin's picture
Upload folder using huggingface_hub
96fe658 verified
raw
history blame contribute delete
744 Bytes
import os
import torch
# Default device visibility for this module: expose only device 0.
# test_sft() overwrites this value before it launches training.
os.environ['CUDA_VISIBLE_DEVICES'] = '0'

# Training options shared by the tests in this file; they are unpacked
# into TrainArguments as keyword arguments.
kwargs = dict(
    per_device_train_batch_size=2,
    save_steps=50,
    gradient_accumulation_steps=4,
    num_train_epochs=1,
)
def test_sft():
    """Run supervised fine-tuning of Qwen2-7B-Instruct on the agent dataset.

    Builds a ``TrainArguments`` from the module-level ``kwargs`` plus the
    model, dataset and loss-scale settings below, and hands it to
    ``sft_main``. Nothing is returned or asserted; the test passes when the
    training call completes without raising.
    """
    # Overrides the module-level default so that devices 0 and 1 are visible.
    os.environ['CUDA_VISIBLE_DEVICES'] = '0,1'

    # Imported inside the function, after the environment variable is set.
    # Only the two names this test actually uses are imported.
    from swift.llm import sft_main, TrainArguments

    # NOTE(review): the '#2000' suffix presumably limits the dataset to 2000
    # samples, and loss_scale='react' presumably selects the ReAct-style loss
    # weighting -- confirm both against the ms-swift documentation.
    sft_main(
        TrainArguments(
            model='Qwen/Qwen2-7B-Instruct',
            dataset=['iic/ms_agent#2000'],
            loss_scale='react',
            **kwargs))
def test_infer():
    """Run inference from a previously saved fine-tuning checkpoint.

    Passes the checkpoint directory to ``InferArguments`` and runs
    ``infer_main`` on it. Nothing is returned or asserted.
    """
    from swift.llm import InferArguments, infer_main

    # NOTE: this path names one specific local training run; it must be
    # updated to an existing checkpoint directory before the test can run.
    infer_args = InferArguments(
        ckpt_dir='output/Qwen2-7B-Instruct/v229-20241126-133152/checkpoint-100')
    infer_main(infer_args)
if __name__ == '__main__':
    # Running the file directly executes only the fine-tuning test.
    # To run inference against a saved checkpoint instead, call
    # test_infer() here in place of test_sft().
    test_sft()