diff --git a/vllm/engine/llm_engine.py b/vllm/engine/llm_engine.py index 835803fd..4caecb8a 100644 --- a/vllm/engine/llm_engine.py +++ b/vllm/engine/llm_engine.py @@ -8,7 +8,8 @@ from vllm.config import (CacheConfig, DecodingConfig, DeviceConfig, LoadConfig, LoRAConfig, ModelConfig, ParallelConfig, SchedulerConfig, SpeculativeConfig, VisionLanguageConfig) -from vllm.core.scheduler import Scheduler, SchedulerOutputs +from vllm.core.scheduler import (ScheduledSequenceGroup, Scheduler, + SchedulerOutputs) from vllm.engine.arg_utils import EngineArgs from vllm.engine.metrics import StatLogger, Stats from vllm.engine.output_processor.interfaces import ( @@ -485,7 +486,7 @@ class LLMEngine: def _process_model_outputs( self, output: List[SamplerOutput], - scheduled_seq_groups: List[SequenceGroup], + scheduled_seq_groups: List[ScheduledSequenceGroup], ignored_seq_groups: List[SequenceGroup], seq_group_metadata_list: List[SequenceGroupMetadata], ) -> List[RequestOutput]: