Skip to content

Commit fcce1db

Browse files
committed
fix main
Signed-off-by: Yannick Schnider <[email protected]>
1 parent fb8011a commit fcce1db

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

vllm_spyre/v1/worker/spyre_worker.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -29,7 +29,7 @@
29 29   import vllm_spyre.perf_metrics as perf_metrics
30 30   from vllm_spyre.model_executor.model_loader import spyre_setup
31 31   from vllm_spyre.platform import SpyrePlatform
32    - from vllm_spyre.v1.worker.spyre_input_batch import InputBatch
   32 + from vllm_spyre.v1.worker.spyre_input_batch import SamplingInputBatch
33 33   from vllm_spyre.v1.worker.spyre_model_runner import (
34 34       ContinuousBatchingSpyreModelRunner, SpyrePoolingModelRunner,
35 35       StaticBatchingSpyreModelRunner, SupportedTask)
@@ -329,7 +329,7 @@ def _warmup_spyre_dynamic_size(self, special_token_ids):
329 329
330 330           # Fix for batch size 1: set input batch to fit 2 requests for warmup
331 331           if model_runner.vllm_config.scheduler_config.max_num_seqs == 1:
332     -             model_runner.input_batch = InputBatch(
    332 +             model_runner.input_batch = SamplingInputBatch(
333 333                   max_num_reqs=2,
334 334                   max_model_len=model_runner.vllm_config.model_config.
335 335                   max_model_len,
@@ -388,7 +388,7 @@ def _warmup_spyre_dynamic_size(self, special_token_ids):
388 388
389 389           # Fix for batch size 1: reset input batch to fit max_num_seqs requests
390 390           if model_runner.vllm_config.scheduler_config.max_num_seqs == 1:
391     -             model_runner.input_batch = InputBatch(
    391 +             model_runner.input_batch = SamplingInputBatch(
392 392                   max_num_reqs=model_runner.vllm_config.scheduler_config.
393 393                   max_num_seqs,
394 394                   max_model_len=model_runner.vllm_config.model_config.

0 commit comments

Comments
 (0)