Skip to content

Commit

Permalink
cherry picked PR vllm-project#8870
Browse files Browse the repository at this point in the history
  • Loading branch information
tripathiarpan20 committed Oct 2, 2024
1 parent 7193774 commit 0d028cc
Showing 1 changed file with 3 additions and 1 deletion.
4 changes: 3 additions & 1 deletion vllm/worker/enc_dec_model_runner.py
Original file line number Diff line number Diff line change
Expand Up @@ -268,11 +268,13 @@ def prepare_model_input(
encoder_input_positions=encoder_input_positions_tensor,
)

+ generators = self.get_generators(finished_requests_ids)
sampling_metadata = SamplingMetadata.prepare(seq_group_metadata_list,
model_input.seq_lens,
model_input.query_lens,
self.device,
- self.pin_memory)
+ self.pin_memory,
+ generators=generators)
is_prompt = (seq_group_metadata_list[0].is_prompt
if seq_group_metadata_list else None)
return dataclasses.replace(model_input,
Expand Down

0 comments on commit 0d028cc

Please sign in to comment.