diff --git a/qwen2_5_Instruct_model_predict_vllm_1.py b/qwen2_5_Instruct_model_predict_vllm_1.py index 5d26fbd..7060149 100644 --- a/qwen2_5_Instruct_model_predict_vllm_1.py +++ b/qwen2_5_Instruct_model_predict_vllm_1.py @@ -162,7 +162,7 @@ def classify(batch_size): # 调用模型,设置最大batch_size sampling_params_list.append(SamplingParams( temperature=temperature, top_p=top_p, - stop="<|end|>", + stop="<|im_end|>", presence_penalty=presence_penalty, max_tokens=max_tokens )) diff --git a/qwen2_5_Instruct_model_predict_vllm_2.py b/qwen2_5_Instruct_model_predict_vllm_2.py index 65279a2..2273adf 100644 --- a/qwen2_5_Instruct_model_predict_vllm_2.py +++ b/qwen2_5_Instruct_model_predict_vllm_2.py @@ -162,7 +162,7 @@ def classify(batch_size): # 调用模型,设置最大batch_size sampling_params_list.append(SamplingParams( temperature=temperature, top_p=top_p, - stop="<|end|>", + stop="<|im_end|>", presence_penalty=presence_penalty, max_tokens=max_tokens )) diff --git a/qwen2_5_Instruct_model_predict_vllm_3.py b/qwen2_5_Instruct_model_predict_vllm_3.py index 27a8a43..2a21635 100644 --- a/qwen2_5_Instruct_model_predict_vllm_3.py +++ b/qwen2_5_Instruct_model_predict_vllm_3.py @@ -162,7 +162,7 @@ def classify(batch_size): # 调用模型,设置最大batch_size sampling_params_list.append(SamplingParams( temperature=temperature, top_p=top_p, - stop="<|end|>", + stop="<|im_end|>", presence_penalty=presence_penalty, max_tokens=max_tokens ))