We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent dc23fb5, commit 9944bbf (Copy full SHA for 9944bbf)
1 file changed
python/sglang/srt/disaggregation/prefill.py
@@ -226,6 +226,11 @@ def process_disagg_prefill_inflight_queue(self: Scheduler) -> None:
226
elif poll == KVPoll.Failed:
227
raise Exception("Transferring failed")
228
229
+ for req in done_reqs:
230
+ self.disagg_prefill_pending_queue.req_to_metadata_buffer_idx_allocator.free(
231
+ req.metadata_buffer_index
232
+ )
233
+
234
# Stream requests which have finished transfer
235
self.stream_output(done_reqs, False, None)
236
0 commit comments