Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
7 changes: 6 additions & 1 deletion python/sglang/compile_deep_gemm.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@

import requests

from sglang.srt.disaggregation.utils import FAKE_BOOTSTRAP_HOST
Comment thread
lbh2001 marked this conversation as resolved.
from sglang.srt.entrypoints.http_server import launch_server
from sglang.srt.managers.io_struct import GenerateReqInput
from sglang.srt.managers.tokenizer_manager import TokenizerManager
Expand Down Expand Up @@ -52,7 +53,7 @@ def from_cli_args(cls, args: argparse.Namespace):


@warmup("compile-deep-gemm")
-async def warm_up_compile(tokenizer_manager: TokenizerManager):
+async def warm_up_compile(disaggregation_mode: str, tokenizer_manager: TokenizerManager):
print("\nGenerate warm up request for compiling DeepGEMM...\n")
generate_req_input = GenerateReqInput(
input_ids=[0, 1, 2, 3],
Expand All @@ -62,6 +63,10 @@ async def warm_up_compile(tokenizer_manager: TokenizerManager):
"ignore_eos": True,
},
)
if disaggregation_mode != "null":
Comment thread
lbh2001 marked this conversation as resolved.
generate_req_input.bootstrap_room = 0
generate_req_input.bootstrap_host = FAKE_BOOTSTRAP_HOST

await tokenizer_manager.generate_request(generate_req_input, None).__anext__()


Expand Down