Improve disagg-example.sh (#8)

tlrmchlsmth · web-flow · commit 7a1f25f71452 · 2025-04-21T13:57:29.000-04:00
- fix spelling
- CUDA_VISIBLE_DEVICES should be set externally

Signed-off-by: Tyler Michael Smith &lt;tyler@neuralmagic.com&gt;
diff --git a/examples/other/LMCache/disagg-example.sh b/examples/other/LMCache/disagg-example.sh
@@ -3,7 +3,7 @@
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 
 if [[ $# -lt 1 ]]; then
-    echo "Usage: $0 <prefiller | decoder | proxy> [model]"
+    echo "Usage: $0 <prefill | decode | proxy> [model]"
     exit 1
 fi
 
@@ -16,7 +16,7 @@ else
 fi
 
 
-if [[ $1 == "prefiller" ]]; then
+if [[ $1 == "prefill" ]]; then
     # Prefiller listens on port 8100
     prefill_config_file=$SCRIPT_DIR/configs/lmcache-prefiller-config.yaml
 
@@ -25,7 +25,6 @@ if [[ $1 == "prefiller" ]]; then
         LMCACHE_USE_EXPERIMENTAL=True \
         VLLM_ENABLE_V1_MULTIPROCESSING=1 \
         VLLM_WORKER_MULTIPROC_METHOD=spawn \
-        CUDA_VISIBLE_DEVICES=6 \
         vllm serve $MODEL \
         --port 8100 \
         --enforce-eager \
@@ -36,7 +35,7 @@ if [[ $1 == "prefiller" ]]; then
     # LMCACHE_LOG_LEVEL=DEBUG -- Set log level to DEBUG
     # --enforce-eager -- Enforce eager mode
 
-elif [[ $1 == "decoder" ]]; then
+elif [[ $1 == "decode" ]]; then
     # Decoder listens on port 8200
     decode_config_file=$SCRIPT_DIR/configs/lmcache-decoder-config.yaml
 
@@ -45,7 +44,6 @@ elif [[ $1 == "decoder" ]]; then
         LMCACHE_USE_EXPERIMENTAL=True \
         VLLM_ENABLE_V1_MULTIPROCESSING=1 \
         VLLM_WORKER_MULTIPROC_METHOD=spawn \
-        CUDA_VISIBLE_DEVICES=7 \
         vllm serve $MODEL \
         --port 8200 \
         --enforce-eager \