We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
end_forward
1 parent 79d7d66 commit 95f3845 · Copy full SHA for 95f3845
vllm/attention/backends/flashinfer.py
@@ -126,6 +126,7 @@ def begin_forward(self):
126
self.paged_kv_indptr = self.paged_kv_indptr.to(self.device)
127
self.paged_kv_last_page_len = self.paged_kv_last_page_len.to(
128
self.device)
129
+ self.prefill_wrapper.end_forward()
130
self.prefill_wrapper.begin_forward(
131
self.query_start_loc, self.paged_kv_indptr,
132
self.paged_kv_indices, self.paged_kv_last_page_len,
@@ -142,6 +143,7 @@ def begin_forward(self):
142
143
144
145
assert self.decode_wrapper is not None
146
+ self.decode_wrapper.end_forward()
147
self.decode_wrapper.begin_forward(
148
self.paged_kv_indptr,
149
self.paged_kv_indices,
0 commit comments