# NOTE(woosuk): The persistent batch optimization assumes that
# consecutive batches contain mostly the same requests. If batches
# have low request overlap (e.g., alternating between two distinct
# sets of requests), this optimization becomes very inefficient.
#
# Remove every request listed in `unscheduled_req_ids` from the input
# batch, one `remove_request` call per request ID.
for req_id in unscheduled_req_ids:
    self.input_batch.remove_request(req_id)