Skip to content

Commit 0d028cc

Browse files
Cherry-picked PR vllm-project#8870
1 parent 7193774 commit 0d028cc

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

vllm/worker/enc_dec_model_runner.py

+3 -1
Original file line number | Diff line number | Diff line change
@@ -268,11 +268,13 @@ def prepare_model_input(
268268
encoder_input_positions=encoder_input_positions_tensor,
269269
)
270270

271+
generators = self.get_generators(finished_requests_ids)
271272
sampling_metadata = SamplingMetadata.prepare(seq_group_metadata_list,
272273
model_input.seq_lens,
273274
model_input.query_lens,
274275
self.device,
275-
self.pin_memory)
276+
self.pin_memory,
277+
generators=generators)
276278
is_prompt = (seq_group_metadata_list[0].is_prompt
277279
if seq_group_metadata_list else None)
278280
return dataclasses.replace(model_input,

0 commit comments

Comments
 (0)