|
29 | 29 | RELEASE_TAG="v${MAJOR}.${MINOR}.0-rc.${RC}" |
30 | 30 | fi |
31 | 31 |
|
32 | | -# vLLM image version (default to 0.7.2 if not defined) |
33 | | -VLLM="${VLLM:-0.7.2}" |
| 32 | +# The vLLM image versions |
| 33 | +# The GPU image is from https://hub.docker.com/layers/vllm/vllm-openai |
| 34 | +VLLM_GPU="${VLLM_GPU:-0.9.1}" |
| 35 | +# The CPU image is from https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo |
| 36 | +VLLM_CPU="${VLLM_CPU:-0.9.1}" |
| 37 | +# The sim image is from https://github.com/llm-d/llm-d-inference-sim/pkgs/container/llm-d-inference-sim |
| 38 | +VLLM_SIM="${VLLM_SIM:-0.1.1}" |
34 | 39 |
|
35 | 40 | echo "Using release tag: ${RELEASE_TAG}" |
36 | | -echo "Using vLLM image version: ${VLLM}" |
| 41 | +echo "Using vLLM GPU image version: ${VLLM_GPU}" |
| 42 | +echo "Using vLLM CPU image version: ${VLLM_CPU}" |
| 43 | +echo "Using vLLM Simulator image version: ${VLLM_SIM}" |
37 | 44 |
|
38 | 45 | # ----------------------------------------------------------------------------- |
39 | 46 | # Update pkg/README.md |
@@ -64,30 +71,48 @@ sed -i.bak -E "s|(tag: )[^\"[:space:]]+|\1${RELEASE_TAG}|g" "$EPP_HELM" |
64 | 71 | sed -i.bak -E "s|(tag: )[^\"[:space:]]+|\1${RELEASE_TAG}|g" "$BBR_HELM" |
65 | 72 |
|
66 | 73 | # Update the container image pull policy. |
67 | | -sed -i.bak '/us-central1-docker.pkg.dev\/k8s-staging-images\/gateway-api-inference-extension\/epp/ { n; s/Always/IfNotPresent/ }' "$EPP" |
| 74 | +sed -i.bak '/us-central1-docker.pkg.dev\/k8s-staging-images\/gateway-api-inference-extension\/epp/{n;s/Always/IfNotPresent/;}' "$EPP" |
68 | 75 |
|
69 | 76 | # Update the container registry. |
70 | 77 | sed -i.bak -E "s|us-central1-docker\.pkg\.dev/k8s-staging-images|registry.k8s.io|g" "$EPP" |
71 | 78 | sed -i.bak -E "s|us-central1-docker\.pkg\.dev/k8s-staging-images|registry.k8s.io|g" "$EPP_HELM" |
72 | 79 | sed -i.bak -E "s|us-central1-docker\.pkg\.dev/k8s-staging-images|registry.k8s.io|g" "$BBR_HELM" |
73 | 80 |
|
74 | 81 | # ----------------------------------------------------------------------------- |
75 | | -# Update config/manifests/vllm/gpu-deployment.yaml |
| 82 | +# Update vLLM deployment manifests |
76 | 83 | # ----------------------------------------------------------------------------- |
77 | | -VLLM_DEPLOY="config/manifests/vllm/gpu-deployment.yaml" |
78 | | -echo "Updating ${VLLM_DEPLOY} ..." |
| 84 | +VLLM_GPU_DEPLOY="config/manifests/vllm/gpu-deployment.yaml" |
| 85 | +echo "Updating ${VLLM_GPU_DEPLOY} ..." |
79 | 86 |
|
80 | | -# Update the vLLM image version |
81 | | -sed -i.bak -E "s|(vllm/vllm-openai:)[^\"[:space:]]+|\1v${VLLM}|g" "$VLLM_DEPLOY" |
| 87 | +# Update the vLLM GPU image version |
| 88 | +sed -i.bak -E "s|(vllm/vllm-openai:)[^\"[:space:]]+|\1v${VLLM_GPU}|g" "$VLLM_GPU_DEPLOY" |
82 | 89 |
|
83 | 90 | # Also change the imagePullPolicy from Always to IfNotPresent on the line following the vLLM GPU image reference.
84 | | -sed -i.bak '/vllm\/vllm-openai/ { n; s/Always/IfNotPresent/ }' "$VLLM_DEPLOY" |
| 91 | +sed -i.bak '/vllm\/vllm-openai/{n;s/Always/IfNotPresent/;}' "$VLLM_GPU_DEPLOY" |
| 92 | + |
| 93 | +VLLM_CPU_DEPLOY="config/manifests/vllm/cpu-deployment.yaml" |
| 94 | +echo "Updating ${VLLM_CPU_DEPLOY} ..." |
| 95 | + |
| 96 | +# Update the vLLM CPU image version |
| 97 | +sed -i.bak -E "s|(q9t5s3a7/vllm-cpu-release-repo:)[^\"[:space:]]+|\1v${VLLM_CPU}|g" "$VLLM_CPU_DEPLOY" |
| 98 | + |
| 99 | +# Also change the imagePullPolicy from Always to IfNotPresent on the line following the vLLM CPU image reference. |
| 100 | +sed -i.bak '/q9t5s3a7\/vllm-cpu-release-repo/{n;s/Always/IfNotPresent/;}' "$VLLM_CPU_DEPLOY" |
| 101 | + |
| 102 | +VLLM_SIM_DEPLOY="config/manifests/vllm/sim-deployment.yaml" |
| 103 | +echo "Updating ${VLLM_SIM_DEPLOY} ..." |
| 104 | + |
| 105 | +# Update the vLLM Simulator image version |
| 106 | +sed -i.bak -E "s|(llm-d/llm-d-inference-sim:)[^\"[:space:]]+|\1v${VLLM_SIM}|g" "$VLLM_SIM_DEPLOY" |
| 107 | + |
| 108 | +# Also change the imagePullPolicy from Always to IfNotPresent on the line following the vLLM Simulator image reference. |
| 109 | +sed -i.bak '/llm-d\/llm-d-inference-sim/{n;s/Always/IfNotPresent/;}' "$VLLM_SIM_DEPLOY" |
85 | 110 |
|
86 | 111 | # ----------------------------------------------------------------------------- |
87 | 112 | # Stage the changes |
88 | 113 | # ----------------------------------------------------------------------------- |
89 | | -echo "Staging $README $EPP $EPP_HELM $BBR_HELM $VLLM_DEPLOY files..." |
90 | | -git add $README $EPP $EPP_HELM $BBR_HELM $VLLM_DEPLOY |
| 114 | +echo "Staging $README $EPP $EPP_HELM $BBR_HELM $VLLM_GPU_DEPLOY $VLLM_CPU_DEPLOY $VLLM_SIM_DEPLOY files..." |
| 115 | +git add $README $EPP $EPP_HELM $BBR_HELM $VLLM_GPU_DEPLOY $VLLM_CPU_DEPLOY $VLLM_SIM_DEPLOY |
91 | 116 |
|
92 | 117 | # ----------------------------------------------------------------------------- |
93 | 118 | # Cleanup backup files and finish |
|
0 commit comments