We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7193774, commit 0d028cc. Copy full SHA for 0d028cc
vllm/worker/enc_dec_model_runner.py
@@ -268,11 +268,13 @@ def prepare_model_input(
268
encoder_input_positions=encoder_input_positions_tensor,
269
)
270
271
+ generators = self.get_generators(finished_requests_ids)
272
sampling_metadata = SamplingMetadata.prepare(seq_group_metadata_list,
273
model_input.seq_lens,
274
model_input.query_lens,
275
self.device,
- self.pin_memory)
276
+ self.pin_memory,
277
+ generators=generators)
278
is_prompt = (seq_group_metadata_list[0].is_prompt
279
if seq_group_metadata_list else None)
280
return dataclasses.replace(model_input,
0 commit comments