@@ -95,7 +95,7 @@ echo "----------------------------------------------------------------"
9595echo " Installing Gateway API CRDs v1.2.0..."
9696kubectl apply -f https://github.com/kubernetes-sigs/gateway-api/releases/download/v1.2.0/standard-install.yaml
9797
98- # cert-manager: required for KubeRay webhooks
98+ # cert-manager
9999echo " Installing cert-manager..."
100100kubectl apply --server-side -f https://github.com/cert-manager/cert-manager/releases/download/v1.19.2/cert-manager.yaml
101101
@@ -171,8 +171,17 @@ helm upgrade -i nvidia-dra-driver-gpu nvidia/nvidia-dra-driver-gpu \
171171 --wait
172172
173173# KubeRay
174+ # Use the Helm chart; the kustomize "default-with-webhooks" overlay has incomplete RBAC
175+ # (missing cluster-scope secrets permission), causing the operator to crash-loop.
176+ # The Helm chart does not support webhooks, so we install without them.
174177echo " Installing KubeRay Operator..."
175- kubectl apply --server-side -k "github.com/ray-project/kuberay/ray-operator/config/default-with-webhooks?ref=v1.5.0"
178+ helm repo add kuberay https://ray-project.github.io/kuberay-helm/
179+ helm repo update kuberay
180+ helm upgrade -i kuberay-operator kuberay/kuberay-operator \
181+ --version 1.5.0 \
182+ --namespace ray-system \
183+ --create-namespace \
184+ --wait
176185
177186# Kueue
178187echo " Installing Kueue..."
@@ -193,7 +202,7 @@ echo "Verifying Kueue..."
193202kubectl rollout status deployment -n kueue-system kueue-controller-manager --timeout=5m || echo " Warning: Kueue not ready yet"
194203
195204echo " Verifying KubeRay..."
196- kubectl rollout status deployment -n kuberay-system kuberay-operator --timeout=5m || echo " Warning: KubeRay not ready yet"
205+ kubectl rollout status deployment -n ray-system kuberay-operator --timeout=5m || echo " Warning: KubeRay not ready yet"
197206
198207echo " Verifying Gateway API..."
199208kubectl get gatewayclass || echo " Warning: GatewayClass not found"
0 commit comments