File tree Expand file tree Collapse file tree 9 files changed +13
-9
lines changed
Expand file tree Collapse file tree 9 files changed +13
-9
lines changed Original file line number Diff line number Diff line change @@ -12,8 +12,8 @@ cleanup() {
1212trap cleanup EXIT INT TERM
1313
1414# run ingress
15+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1516python3 -m dynamo.frontend \
16- --http-port=${DYN_HTTP_PORT:- 8000} \
1717 --router-mode kv \
1818 --kv-overlap-score-weight 0 \
1919 --router-reset-states &
Original file line number Diff line number Diff line change @@ -19,7 +19,8 @@ trap cleanup EXIT INT TERM
1919
2020
2121# run frontend
22- python3 -m dynamo.frontend --router-mode kv --http-port ${DYN_HTTP_PORT:- 8000} &
22+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
23+ python3 -m dynamo.frontend --router-mode kv &
2324DYNAMO_PID=$!
2425
2526# run worker
Original file line number Diff line number Diff line change @@ -22,7 +22,8 @@ trap cleanup EXIT INT TERM
2222
2323
2424# run frontend with KV routing for cache-aware optimization
25- python3 -m dynamo.frontend --router-mode kv --http-port ${DYN_HTTP_PORT:- 8000} &
25+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
26+ python3 -m dynamo.frontend --router-mode kv &
2627DYNAMO_PID=$!
2728
2829# run prefill worker
Original file line number Diff line number Diff line change @@ -14,7 +14,8 @@ trap 'echo Cleaning up...; kill 0' EXIT
1414
1515
1616# run frontend
17- python3 -m dynamo.frontend --router-mode round-robin --http-port ${DYN_HTTP_PORT:- 8000} &
17+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
18+ python3 -m dynamo.frontend --router-mode round-robin &
1819
1920# With tensor_parallel_size=4, each worker needs 4 GPUs
2021# run prefill worker
Original file line number Diff line number Diff line change @@ -11,9 +11,9 @@ export PYTHONHASHSEED=0
1111MODEL="Qwen/Qwen3-0.6B"
1212
1313# run frontend + KV router
14+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1415python -m dynamo.frontend \
1516 --router-mode kv \
16- --http-port ${DYN_HTTP_PORT:- 8000} \
1717 --router-reset-states &
1818
1919# run workers with KVBM enabled
Original file line number Diff line number Diff line change @@ -12,9 +12,9 @@ MODEL="Qwen/Qwen3-0.6B"
1212BLOCK_SIZE=64
1313
1414# run frontend + KV router
15+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1516python -m dynamo.frontend \
1617 --router-mode kv \
17- --http-port ${DYN_HTTP_PORT:- 8000} \
1818 --router-reset-states &
1919
2020# run workers
Original file line number Diff line number Diff line change @@ -11,9 +11,9 @@ export PYTHONHASHSEED=0
1111MODEL="Qwen/Qwen3-0.6B"
1212
1313# run decode router with kv-overlap-score-weight 0 for pure load balancing
14+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1415python -m dynamo.frontend \
1516 --router-mode kv \
16- --http-port ${DYN_HTTP_PORT:- 8000} \
1717 --kv-overlap-score-weight 0 \
1818 --router-reset-states &
1919
Original file line number Diff line number Diff line change @@ -13,9 +13,9 @@ BLOCK_SIZE=64
1313
1414# Start frontend with KV routing
1515# The frontend will automatically detect prefill workers and activate an internal prefill router
16+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
1617python -m dynamo.frontend \
1718 --router-mode kv \
18- --http-port ${DYN_HTTP_PORT:- 8000} \
1919 --router-reset-states &
2020
2121# two decode workers
Original file line number Diff line number Diff line change @@ -17,7 +17,8 @@ cleanup() {
1717trap cleanup EXIT INT TERM
1818
1919# run ingress
20- python3 -m dynamo.frontend --http-port=${DYN_HTTP_PORT:- 8000} &
20+ # DYN_HTTP_PORT env var is read by dynamo.frontend (defaults to 8000 if not set)
21+ python3 -m dynamo.frontend &
2122FRONTEND_PID=$!
2223
2324# run the mock worker + template validation generate()
You can’t perform that action at this time.
0 commit comments