diff --git a/vllm/platforms/cuda.py b/vllm/platforms/cuda.py
index 962e2b3aab60..aafc157534db 100644
--- a/vllm/platforms/cuda.py
+++ b/vllm/platforms/cuda.py
@@ -182,9 +182,6 @@ def check_and_update_config(cls, vllm_config: "VllmConfig") -> None:
             compilation_config.use_cudagraph = False
             if model_config is not None:
                 model_config.enforce_eager = True
-            # TODO (varun): Turning this ON gives incorrect results for the
-            # Deepseek-V2-lite model.
-            vllm_config.compilation_config.use_inductor = False
 
     @classmethod
     def get_current_memory_usage(cls,