2020class AsyncEngineRPCServer :
2121
2222 def __init__ (self , async_engine_args : AsyncEngineArgs ,
23- usage_context : UsageContext , port : int ):
23+ usage_context : UsageContext , rpc_path : str ):
2424 # Initialize engine first.
2525 self .engine = AsyncLLMEngine .from_engine_args (async_engine_args ,
2626 usage_context )
@@ -30,9 +30,7 @@ def __init__(self, async_engine_args: AsyncEngineArgs,
3030
3131 # Init socket for readiness state.
3232 self .socket = self .context .socket (zmq .constants .ROUTER )
33- # Note numeric form of localhost should be used for zmq bind(),
34- # see https://stackoverflow.com/a/8958414
35- self .socket .bind (f"tcp://127.0.0.1:{ port } " )
33+ self .socket .bind (rpc_path )
3634
3735 def cleanup (self ):
3836 """Cleanup all resources."""
@@ -213,6 +211,6 @@ def signal_handler() -> None:
213211
214212
215213def run_rpc_server (async_engine_args : AsyncEngineArgs ,
216- usage_context : UsageContext , port : int ):
217- server = AsyncEngineRPCServer (async_engine_args , usage_context , port )
214+ usage_context : UsageContext , rpc_path : str ):
215+ server = AsyncEngineRPCServer (async_engine_args , usage_context , rpc_path )
218216 asyncio .run (run_server (server ))
0 commit comments