|
9 | 9 |
|
10 | 10 | import vllm.envs as envs |
11 | 11 | from vllm.config import (CacheConfig, CompilationConfig, ConfigFormat, |
12 | | - DecodingConfig, DeviceConfig, HfOverrides, LoadConfig, |
13 | | - LoadFormat, LoRAConfig, ModelConfig, |
14 | | - ObservabilityConfig, ParallelConfig, PoolerConfig, |
15 | | - PromptAdapterConfig, SchedulerConfig, |
| 12 | + DecodingConfig, DeviceConfig, HfOverrides, |
| 13 | + KVTransferConfig, LoadConfig, LoadFormat, LoRAConfig, |
| 14 | + ModelConfig, ObservabilityConfig, ParallelConfig, |
| 15 | + PoolerConfig, PromptAdapterConfig, SchedulerConfig, |
16 | 16 | SpeculativeConfig, TaskOption, TokenizerPoolConfig, |
17 | | - VllmConfig, KVTransferConfig) |
| 17 | + VllmConfig) |
18 | 18 | from vllm.executor.executor_base import ExecutorBase |
19 | 19 | from vllm.logger import init_logger |
20 | 20 | from vllm.model_executor.layers.quantization import QUANTIZATION_METHODS |
|
0 commit comments