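Add ignore_eos option to beam_search

When ignore_eos is True, a beam that emits the EOS token is kept among the
active beams instead of being marked completed. The default (False)
preserves the existing behavior.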

vllm-project · youkaichao · Sep 24, 2024 · Sep 16, 2024 · Sep 17, 2024 · Sep 18, 2024
commit da2d815893c1c423073cdf2aac9437787b275009
diff --git a/vllm/entrypoints/llm.py b/vllm/entrypoints/llm.py
@@ -390,6 +390,7 @@ def beam_search(
         prompts: List[Union[str, List[int]]],
         beam_width: int,
         max_tokens: int,
+        ignore_eos: bool = False,
     ) -> List[BeamSearchOutput]:
         """
         Generate sequences using beam search.
@@ -453,7 +454,8 @@ def beam_search(
                                 cum_logprob=current_beam.cum_logprob +
                                 logprob_obj.logprob)
 
-                            if token_id == tokenizer.eos_token_id:
+                            if token_id == tokenizer.eos_token_id and \
+                                not ignore_eos:
                                 instance.completed.append(new_beam)
                             else:
                                 instance_new_beams.append(new_beam)