Skip to content

Commit 8f7a4b2

Browse files
committed
Remove redundant --http-port flag from launch scripts
Signed-off-by: Keiven Chang <[email protected]>
1 parent 3d35006 commit 8f7a4b2

File tree

9 files changed: 13 additions and 9 deletions

examples/backends/sglang/launch/disagg_router.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,8 +12,8 @@ cleanup() {
1212
trap cleanup EXIT INT TERM
1313

1414
# run ingress
15+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1516
python3 -m dynamo.frontend \
16-
--http-port=${DYN_HTTP_PORT:-8000} \
1717
--router-mode kv \
1818
--kv-overlap-score-weight 0 \
1919
--router-reset-states &

examples/backends/trtllm/launch/agg_router.sh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,8 @@ trap cleanup EXIT INT TERM
1919

2020

2121
# run frontend
22-
python3 -m dynamo.frontend --router-mode kv --http-port ${DYN_HTTP_PORT:-8000} &
22+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
23+
python3 -m dynamo.frontend --router-mode kv &
2324
DYNAMO_PID=$!
2425

2526
# run worker

examples/backends/trtllm/launch/disagg_router.sh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,8 @@ trap cleanup EXIT INT TERM
2222

2323

2424
# run frontend with KV routing for cache-aware optimization
25-
python3 -m dynamo.frontend --router-mode kv --http-port ${DYN_HTTP_PORT:-8000} &
25+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
26+
python3 -m dynamo.frontend --router-mode kv &
2627
DYNAMO_PID=$!
2728

2829
# run prefill worker

examples/backends/trtllm/launch/gpt_oss_disagg.sh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,8 @@ trap 'echo Cleaning up...; kill 0' EXIT
1414

1515

1616
# run frontend
17-
python3 -m dynamo.frontend --router-mode round-robin --http-port ${DYN_HTTP_PORT:-8000} &
17+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
18+
python3 -m dynamo.frontend --router-mode round-robin &
1819

1920
# With tensor_parallel_size=4, each worker needs 4 GPUs
2021
# run prefill worker

examples/backends/vllm/launch/agg_kvbm_router.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,9 +11,9 @@ export PYTHONHASHSEED=0
1111
MODEL="Qwen/Qwen3-0.6B"
1212

1313
# run frontend + KV router
14+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1415
python -m dynamo.frontend \
1516
--router-mode kv \
16-
--http-port ${DYN_HTTP_PORT:-8000} \
1717
--router-reset-states &
1818

1919
# run workers with KVBM enabled

examples/backends/vllm/launch/agg_router.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,9 +12,9 @@ MODEL="Qwen/Qwen3-0.6B"
1212
BLOCK_SIZE=64
1313

1414
# run frontend + KV router
15+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1516
python -m dynamo.frontend \
1617
--router-mode kv \
17-
--http-port ${DYN_HTTP_PORT:-8000} \
1818
--router-reset-states &
1919

2020
# run workers

examples/backends/vllm/launch/disagg_kvbm_router.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,9 +11,9 @@ export PYTHONHASHSEED=0
1111
MODEL="Qwen/Qwen3-0.6B"
1212

1313
# run decode router with kv-overlap-score-weight 0 for pure load balancing
14+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1415
python -m dynamo.frontend \
1516
--router-mode kv \
16-
--http-port ${DYN_HTTP_PORT:-8000} \
1717
--kv-overlap-score-weight 0 \
1818
--router-reset-states &
1919

examples/backends/vllm/launch/disagg_router.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,9 +13,9 @@ BLOCK_SIZE=64
1313

1414
# Start frontend with KV routing
1515
# The frontend will automatically detect prefill workers and activate an internal prefill router
16+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1617
python -m dynamo.frontend \
1718
--router-mode kv \
18-
--http-port ${DYN_HTTP_PORT:-8000} \
1919
--router-reset-states &
2020

2121
# two decode workers

tests/serve/launch/template_verifier.sh

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,8 @@ cleanup() {
1717
trap cleanup EXIT INT TERM
1818

1919
# run ingress
20-
python3 -m dynamo.frontend --http-port=${DYN_HTTP_PORT:-8000} &
20+
# DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
21+
python3 -m dynamo.frontend &
2122
FRONTEND_PID=$!
2223

2324
# run the mock worker + template validation generate()

0 commit comments

Comments
 (0)