# Launch supervised fine-tuning by running src/train_sft.py with the
# baichuan-7B checkpoint and the paper_data_v3_prompt dataset.
#
# Usage: run from the directory that contains src/ (the script path below is
# relative). The model and dataset directories are absolute, machine-specific
# paths; adjust them before running elsewhere.
#
# CUDA_VISIBLE_DEVICES=2,3 is set only for this one command, so the Python
# process is started with devices 2 and 3 exposed to it.
#
# NOTE: every continuation backslash must be the LAST character on its line.
# A backslash followed by a space (e.g. when the command is joined onto one
# line) escapes the space instead, which glues a leading blank onto the next
# option (' --do_train') so it is no longer recognised as a flag.
CUDA_VISIBLE_DEVICES=2,3 python src/train_sft.py \
  --model_name_or_path /home/majiahui/models-LLM/baichuan-7B \
  --do_train \
  --dataset paper_data_v3_prompt \
  --dataset_dir /home/majiahui/project2/LLaMA-Efficient-Tuning/data \
  --finetuning_type freeze \
  --max_source_length 700 \
  --max_target_length 1400 \
  --output_dir path_to_sft_checkpoint_paper_prompt_freeze_baichuan \
  --overwrite_cache \
  --per_device_train_batch_size 1 \
  --gradient_accumulation_steps 1 \
  --lr_scheduler_type cosine \
  --logging_steps 10 \
  --save_steps 1000 \
  --learning_rate 5e-5 \
  --num_train_epochs 3.0 \
  --plot_loss \
  --fp16