Skip to content

Commit

Permalink
clear prefill metadata
Browse files Browse the repository at this point in the history
  • Loading branch information
Varun Sundar Rabindranath committed Sep 17, 2024
1 parent 427ef77 commit 0ffa5fd
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions vllm/worker/multi_step_worker.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -76,8 +76,9 @@ def _get_driver_input_and_broadcast(
frozen_model_input = model_input.frozen_model_input
assert frozen_model_input is not None
assert frozen_model_input.attn_metadata is not None
- # clear the cached decode metadata so that it can be recomputed on
- # the workers
+ # clear the cached metadata so that it can be recomputed on
+ # the workers.
+ frozen_model_input.attn_metadata._cached_prefill_metadata = None
frozen_model_input.attn_metadata._cached_decode_metadata = None

model_input.is_first_multi_step = is_first_multi_step
Expand Down

0 comments on commit 0ffa5fd

Please sign in to comment.