diff --git a/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_connector.py b/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_connector.py index 7232d94703..a5240adab4 100644 --- a/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_connector.py +++ b/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_connector.py @@ -13,6 +13,9 @@ from vllm.distributed.kv_transfer.kv_connector.v1.base import ( KVConnectorMetadata, KVConnectorRole, ) +from vllm.distributed.kv_transfer.kv_connector.v1.lmcache_integration import ( + vllm_v1_adapter as _adapter, +) from vllm.logger import init_logger from vllm.v1.core.sched.output import SchedulerOutput @@ -34,11 +37,6 @@ class LMCacheConnectorV1(KVConnectorBase_V1): ) if use_native: logger.info("Initializing native LMCache connector") - # lazy import - from vllm.distributed.kv_transfer.kv_connector.v1 import lmcache_integration - - _adapter = lmcache_integration.vllm_v1_adapter - cls = _adapter.LMCacheConnectorV1Impl else: logger.info("Initializing latest dev LMCache connector") diff --git a/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/__init__.py b/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/__init__.py index 3c73a1c09e..208f01a7cb 100644 --- a/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/__init__.py +++ b/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/__init__.py @@ -1,7 +1,2 @@ # SPDX-License-Identifier: Apache-2.0 # SPDX-FileCopyrightText: Copyright contributors to the vLLM project - - -from . import vllm_v1_adapter - -__all__ = ["vllm_v1_adapter"] diff --git a/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/utils.py b/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/utils.py index 0e87dea59d..e0282c1552 100644 --- a/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/utils.py +++ b/vllm/distributed/kv_transfer/kv_connector/v1/lmcache_integration/utils.py @@ -131,7 +131,7 @@ def create_lmcache_metadata( # First Party from lmcache.config import LMCacheEngineMetadata - from vllm.utils.torch_utils import get_kv_cache_torch_dtype + from vllm.utils import get_kv_cache_torch_dtype config = lmcache_get_or_create_config() # Support both vllm_config object and individual config parameters