|
@@ -35,12 +35,13 @@ from aphrodite.inputs import INPUT_REGISTRY, InputRegistry
|
|
|
from aphrodite.lora.layers import LoRAMapping
|
|
|
from aphrodite.lora.request import LoRARequest
|
|
|
from aphrodite.lora.worker_manager import LRUCacheWorkerLoRAManager
|
|
|
-from aphrodite.modeling import SamplingMetadata, SamplingMetadataCache
|
|
|
from aphrodite.modeling.model_loader import get_model
|
|
|
from aphrodite.modeling.model_loader.tensorizer import TensorizerConfig
|
|
|
from aphrodite.modeling.models.interfaces import (supports_lora,
|
|
|
supports_multimodal)
|
|
|
from aphrodite.modeling.models.utils import set_cpu_offload_max_bytes
|
|
|
+from aphrodite.modeling.sampling_metadata import (SamplingMetadata,
|
|
|
+ SamplingMetadataCache)
|
|
|
from aphrodite.multimodal import (MULTIMODAL_REGISTRY, BatchedTensorInputs,
|
|
|
MultiModalInputs, MultiModalRegistry)
|
|
|
from aphrodite.prompt_adapter.layers import PromptAdapterMapping
|