diff --git a/llm/predict/predictor.py b/llm/predict/predictor.py index 84b9ff62bb55..cc8250862e04 100644 --- a/llm/predict/predictor.py +++ b/llm/predict/predictor.py @@ -1567,7 +1567,7 @@ def send_task_to_queue(task_id): else: if flag_current_rank_run: output_tokens = self.model_inputs["all_token_ids"].numpy() - output_tokens[output_tokens < 0] = self.tokenizer.pad_token_id + output_tokens[output_tokens == -1] = self.tokenizer.eos_token_id if detokenize: outputs = self.tokenizer.batch_decode( output_tokens, skip_special_tokens=True, clean_up_tokenization_spaces=False