We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c650320 commit 3b67ae0 (Copy full SHA for 3b67ae0)
vllm_spyre/worker/spyre_model_runner.py
@@ -284,7 +284,10 @@ def prepare_model_input(
284
# updating indices: set indices of newly finished sequences False
285
if finished_requests_ids:
286
for seq_id in finished_requests_ids:
287
- self.model.indices[self._req_ids2idx[seq_id]] = False
+ # ignore requests that are not in the batch, e.g. requests
288
+ # cancelled while waiting
289
+ if idx := self._req_ids2idx.get(seq_id):
290
+ self.model.indices[idx] = False
291
(input_tokens, input_positions,
292
input_masks) = self._prepare_decode(seq_group_metadata_list)
293
seq_lens = []
0 commit comments