Skip to content
This repository was archived by the owner on Oct 11, 2024. It is now read-only.

Commit b290035

Browse files
njhill authored and Robert Shaw committed
[Core] Move ray_utils.py from engine to executor package (vllm-project#4347)
1 parent e207f23 commit b290035

File tree

7 files changed

+11
-9
lines changed

7 files changed

+11
-9
lines changed

vllm/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,8 +3,8 @@
33
from vllm.engine.arg_utils import AsyncEngineArgs, EngineArgs
44
from vllm.engine.async_llm_engine import AsyncLLMEngine
55
from vllm.engine.llm_engine import LLMEngine
6-
from vllm.engine.ray_utils import initialize_ray_cluster
76
from vllm.entrypoints.llm import LLM
7+
from vllm.executor.ray_utils import initialize_ray_cluster
88
from vllm.model_executor.models import ModelRegistry
99
from vllm.outputs import CompletionOutput, RequestOutput
1010
from vllm.sampling_params import SamplingParams

vllm/engine/async_llm_engine.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@
1010
from vllm.config import ModelConfig
1111
from vllm.engine.arg_utils import AsyncEngineArgs
1212
from vllm.engine.llm_engine import LLMEngine
13-
from vllm.engine.ray_utils import initialize_ray_cluster, ray
13+
from vllm.executor.ray_utils import initialize_ray_cluster, ray
1414
from vllm.logger import init_logger
1515
from vllm.lora.request import LoRARequest
1616
from vllm.outputs import RequestOutput

vllm/engine/llm_engine.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,8 +15,8 @@
1515
SequenceGroupOutputProcessor)
1616
from vllm.engine.output_processor.stop_checker import StopChecker
1717
from vllm.engine.output_processor.util import create_output_by_sequence_group
18-
from vllm.engine.ray_utils import initialize_ray_cluster
1918
from vllm.executor.executor_base import ExecutorBase
19+
from vllm.executor.ray_utils import initialize_ray_cluster
2020
from vllm.logger import init_logger
2121
from vllm.lora.request import LoRARequest
2222
from vllm.outputs import RequestOutput

vllm/executor/ray_gpu_executor.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -5,8 +5,8 @@
55
from itertools import islice, repeat
66
from typing import TYPE_CHECKING, Any, Dict, List, Optional, Set, Tuple
77

8-
from vllm.engine.ray_utils import RayWorkerWrapper, ray
98
from vllm.executor.executor_base import ExecutorAsyncBase, ExecutorBase
9+
from vllm.executor.ray_utils import RayWorkerWrapper, ray
1010
from vllm.logger import init_logger
1111
from vllm.lora.request import LoRARequest
1212
from vllm.sequence import SamplerOutput, SequenceGroupMetadata
@@ -74,7 +74,7 @@ def _init_workers_ray(self, placement_group: "PlacementGroup",
7474

7575
# The driver dummy worker does not actually use any resources.
7676
# It holds the resource for the driver worker.
77-
self.driver_dummy_worker: RayWorkerWrapper = None
77+
self.driver_dummy_worker: Optional[RayWorkerWrapper] = None
7878
# The remaining workers are the actual ray actors.
7979
self.workers: List[RayWorkerWrapper] = []
8080

@@ -318,6 +318,7 @@ def _run_workers(
318318
driver_worker_output = self.driver_worker.execute_method(
319319
method, *driver_args, **driver_kwargs)
320320
else:
321+
assert self.driver_dummy_worker is not None
321322
driver_worker_output = ray.get(
322323
self.driver_dummy_worker.execute_method.remote(
323324
method, *driver_args, **driver_kwargs))
@@ -353,8 +354,9 @@ def _compiled_ray_dag(self):
353354
# a dummy value for now. It will be fixed soon.
354355
with InputNode() as input_data:
355356
forward_dag = MultiOutputNode([
356-
worker.execute_model_compiled_dag_remote.bind(input_data)
357-
for worker in self.workers
357+
worker.execute_model_compiled_dag_remote.
358+
bind( # type: ignore[attr-defined]
359+
input_data) for worker in self.workers
358360
])
359361
return forward_dag.experimental_compile()
360362

File renamed without changes.

vllm/transformers_utils/tokenizer_group/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
from typing import Optional
22

33
from vllm.config import TokenizerPoolConfig
4-
from vllm.engine.ray_utils import ray
4+
from vllm.executor.ray_utils import ray
55
from vllm.transformers_utils.tokenizer_group.base_tokenizer_group import (
66
BaseTokenizerGroup)
77
from vllm.transformers_utils.tokenizer_group.tokenizer_group import (

vllm/transformers_utils/tokenizer_group/ray_tokenizer_group.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,7 @@
66
from transformers import PreTrainedTokenizer
77

88
from vllm.config import TokenizerPoolConfig
9-
from vllm.engine.ray_utils import ray
9+
from vllm.executor.ray_utils import ray
1010
from vllm.lora.request import LoRARequest
1111
from vllm.transformers_utils.tokenizer_group.base_tokenizer_group import (
1212
BaseTokenizerGroup)

0 commit comments

Comments
 (0)