Code quality improvements: version update, type annotation enhancement, and enum usage simplification (#27581)

Signed-off-by: Bradley <bradley.b.pitt@gmail.com>
This commit is contained in:
usberkeley
2025-10-28 01:50:22 +08:00
committed by GitHub
parent 921e78f4bb
commit 69f064062b
3 changed files with 7 additions and 9 deletions

View File

@ -41,11 +41,11 @@ You can add any other [engine-args](../configuration/engine_args.md) you need af
create a custom Dockerfile on top of the base image with an extra layer that installs them:
```Dockerfile
FROM vllm/vllm-openai:v0.9.0
FROM vllm/vllm-openai:v0.11.0
# e.g. install the `audio` optional dependencies
# NOTE: Make sure the version of vLLM matches the base image!
RUN uv pip install --system vllm[audio]==0.9.0
RUN uv pip install --system vllm[audio]==0.11.0
```
!!! tip

View File

@ -368,7 +368,7 @@ class MultiModalProfiler(Generic[_I]):
self,
seq_len: int,
mm_counts: Mapping[str, int] | None = None,
):
) -> Mapping[str, int]:
"""
Returns the maximum length of the multimodal (image placeholders + text)
tokens, including any break/text tokens in between image embeddings.

View File

@ -113,14 +113,12 @@ class Scheduler(SchedulerInterface):
# req_id -> Request
self.requests: dict[str, Request] = {}
# Scheduling policy
if self.scheduler_config.policy == "priority":
self.policy = SchedulingPolicy.PRIORITY
elif self.scheduler_config.policy == "fcfs":
self.policy = SchedulingPolicy.FCFS
else:
try:
self.policy = SchedulingPolicy(self.scheduler_config.policy)
except ValueError as e:
raise ValueError(
f"Unknown scheduling policy: {self.scheduler_config.policy}"
)
) from e
# Priority queues for requests.
self.waiting = create_request_queue(self.policy)
self.running: list[Request] = []