@@ -45,16 +45,16 @@ if [ "$ENABLE_OTEL" = true ]; then
4545fi
4646
4747# run ingress
48+ # dynamo.frontend accepts either --http-port flag or DYN_HTTP_PORT env var (defaults to 8000)
4849OTEL_SERVICE_NAME=dynamo-frontend \
4950python3 -m dynamo.frontend \
50- --http-port=8000 \
5151 --router-mode kv \
5252 --kv-overlap-score-weight 0 \
5353 --router-reset-states &
5454DYNAMO_PID=$!
5555
5656# run prefill router
57- OTEL_SERVICE_NAME=dynamo-router-prefill DYN_SYSTEM_PORT=8081 \
57+ OTEL_SERVICE_NAME=dynamo-router-prefill DYN_SYSTEM_PORT=${DYN_SYSTEM_PORT_PREFILL_ROUTER:-8081} \
5858python3 -m dynamo.router \
5959 --endpoint dynamo.prefill.generate \
6060 --block-size 64 \
@@ -63,7 +63,7 @@ python3 -m dynamo.router \
6363PREFILL_ROUTER_PID=$!
6464
6565# run prefill worker
66- OTEL_SERVICE_NAME=dynamo-worker-prefill-1 DYN_SYSTEM_PORT=8082 \
66+ OTEL_SERVICE_NAME=dynamo-worker-prefill-1 DYN_SYSTEM_PORT=${DYN_SYSTEM_PORT_PREFILL_WORKER1:-8082} \
6767python3 -m dynamo.sglang \
6868 --model-path deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
6969 --served-model-name deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
@@ -78,7 +78,7 @@ python3 -m dynamo.sglang \
7878PREFILL_PID=$!
7979
8080# run prefill worker
81- OTEL_SERVICE_NAME=dynamo-worker-prefill-2 DYN_SYSTEM_PORT=8083 \
81+ OTEL_SERVICE_NAME=dynamo-worker-prefill-2 DYN_SYSTEM_PORT=${DYN_SYSTEM_PORT_PREFILL_WORKER2:-8083} \
8282CUDA_VISIBLE_DEVICES=1 python3 -m dynamo.sglang \
8383 --model-path deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
8484 --served-model-name deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
@@ -93,7 +93,7 @@ CUDA_VISIBLE_DEVICES=1 python3 -m dynamo.sglang \
9393PREFILL_PID=$!
9494
9595# run decode worker
96- OTEL_SERVICE_NAME=dynamo-worker-decode-1 DYN_SYSTEM_PORT=8084 \
96+ OTEL_SERVICE_NAME=dynamo-worker-decode-1 DYN_SYSTEM_PORT=${DYN_SYSTEM_PORT_DECODE_WORKER1:-8084} \
9797CUDA_VISIBLE_DEVICES=3 python3 -m dynamo.sglang \
9898 --model-path deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
9999 --served-model-name deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
@@ -108,7 +108,7 @@ CUDA_VISIBLE_DEVICES=3 python3 -m dynamo.sglang \
108108PREFILL_PID=$!
109109
110110# run decode worker
111- OTEL_SERVICE_NAME=dynamo-worker-decode-2 DYN_SYSTEM_PORT=8085 \
111+ OTEL_SERVICE_NAME=dynamo-worker-decode-2 DYN_SYSTEM_PORT=${DYN_SYSTEM_PORT_DECODE_WORKER2:-8085} \
112112CUDA_VISIBLE_DEVICES=2 python3 -m dynamo.sglang \
113113 --model-path deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
114114 --served-model-name deepseek-ai/DeepSeek-R1-Distill-Llama-8B \
0 commit comments