| import os | |
| import torch | |
# Default to a single visible GPU for this script; test_sft() overrides
# this value before it launches training.
os.environ['CUDA_VISIBLE_DEVICES'] = '0'

# Training overrides that test_sft() forwards to TrainArguments via **kwargs.
kwargs = dict(
    per_device_train_batch_size=2,
    save_steps=50,
    gradient_accumulation_steps=4,
    num_train_epochs=1,
)
def test_sft():
    """Run a short supervised fine-tuning job on Qwen2-7B-Instruct.

    Trains on the ``iic/ms_agent#2000`` dataset spec with the ``react``
    loss scale, using the module-level ``kwargs`` for batch size, save
    interval, gradient accumulation and epoch count.
    """
    # Replace the module-level single-GPU setting with two devices. This is
    # done before swift is imported below.
    # NOTE(review): presumably this must precede CUDA initialisation to take
    # effect -- confirm.
    os.environ['CUDA_VISIBLE_DEVICES'] = '0,1'

    # Imported lazily so the environment variable above is already set.
    # Only the names this function uses are imported.
    from swift.llm import sft_main, TrainArguments

    train_args = TrainArguments(
        model='Qwen/Qwen2-7B-Instruct',
        # NOTE(review): '#2000' presumably limits the dataset to 2000
        # samples -- confirm against the ms-swift dataset syntax.
        dataset=['iic/ms_agent#2000'],
        loss_scale='react',
        **kwargs,
    )
    sft_main(train_args)
def test_infer():
    """Run inference from a previously saved fine-tuning checkpoint.

    The checkpoint directory is hard-coded to one specific training run;
    edit it to point at an existing checkpoint before calling this.
    """
    from swift.llm import InferArguments, infer_main

    infer_args = InferArguments(
        ckpt_dir='output/Qwen2-7B-Instruct/v229-20241126-133152/checkpoint-100',
    )
    infer_main(infer_args)
if __name__ == '__main__':
    # Script entry point: only the training step runs by default.
    # To run inference instead, call test_infer() here once its checkpoint
    # path points at an existing checkpoint.
    test_sft()