Skip to content

Commit 4c4130e

Browse files
authored
chore: typo and new commands (#3617)
1 parent 5744548 commit 4c4130e

File tree

2 files changed

+3
-7
lines changed

2 files changed

+3
-7
lines changed

components/backends/sglang/deploy/disagg.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -61,7 +61,7 @@ spec:
6161
image: my-registry/sglang-runtime:my-tag
6262
workingDir: /workspace/components/backends/sglang
6363
command:
64-
- python3E
64+
- python3
6565
- -m
6666
- dynamo.sglang
6767
args:

components/backends/sglang/launch/disagg_dp_attn.sh

Lines changed: 2 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -16,10 +16,6 @@ trap cleanup EXIT INT TERM
1616
python3 -m dynamo.frontend --http-port=8000 &
1717
DYNAMO_PID=$!
1818

19-
# Set the expert distribution recording directory
20-
mkdir -p /tmp/sglang_expert_distribution_record
21-
export SGLANG_EXPERT_DISTRIBUTION_RECORDER_DIR=/tmp/sglang_expert_distribution_record
22-
2319
# run prefill worker
2420
python3 -m dynamo.sglang \
2521
--model-path silence09/DeepSeek-R1-Small-2layers \
@@ -31,7 +27,7 @@ python3 -m dynamo.sglang \
3127
--trust-remote-code \
3228
--disaggregation-mode prefill \
3329
--disaggregation-transfer-backend nixl \
34-
--expert-distribution-recorder-mode stat \
30+
--load-balance-method round_robin \
3531
--port 30000 &
3632
PREFILL_PID=$!
3733

@@ -46,5 +42,5 @@ CUDA_VISIBLE_DEVICES=2,3 python3 -m dynamo.sglang \
4642
--trust-remote-code \
4743
--disaggregation-mode decode \
4844
--disaggregation-transfer-backend nixl \
49-
--expert-distribution-recorder-mode stat \
45+
--prefill-round-robin-balance \
5046
--port 31000

0 commit comments

Comments
 (0)