File tree Expand file tree Collapse file tree 1 file changed +8
-1
lines changed Expand file tree Collapse file tree 1 file changed +8
-1
lines changed Original file line number Diff line number Diff line change 17
17
18
18
import requests
19
19
20
+ from sglang .srt .disaggregation .utils import FAKE_BOOTSTRAP_HOST
20
21
from sglang .srt .entrypoints .http_server import launch_server
21
22
from sglang .srt .managers .io_struct import GenerateReqInput
22
23
from sglang .srt .managers .tokenizer_manager import TokenizerManager
@@ -52,7 +53,9 @@ def from_cli_args(cls, args: argparse.Namespace):
52
53
53
54
54
55
@warmup ("compile-deep-gemm" )
55
- async def warm_up_compile (tokenizer_manager : TokenizerManager ):
56
+ async def warm_up_compile (
57
+ disaggregation_mode : str , tokenizer_manager : TokenizerManager
58
+ ):
56
59
print ("\n Generate warm up request for compiling DeepGEMM...\n " )
57
60
generate_req_input = GenerateReqInput (
58
61
input_ids = [0 , 1 , 2 , 3 ],
@@ -62,6 +65,10 @@ async def warm_up_compile(tokenizer_manager: TokenizerManager):
62
65
"ignore_eos" : True ,
63
66
},
64
67
)
68
+ if disaggregation_mode != "null" :
69
+ generate_req_input .bootstrap_room = 0
70
+ generate_req_input .bootstrap_host = FAKE_BOOTSTRAP_HOST
71
+
65
72
await tokenizer_manager .generate_request (generate_req_input , None ).__anext__ ()
66
73
67
74
You can’t perform that action at this time.
0 commit comments