Skip to content

Commit 0b6c130

Browse files
committed
[aiconformance]: Install kuberay from helm
The kustomize version seems to have RBAC problems, particularly with webhooks.
1 parent 998620e commit 0b6c130

1 file changed

Lines changed: 12 additions & 3 deletions

File tree

tests/e2e/scenarios/ai-conformance/run-test.sh

Lines changed: 12 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -95,7 +95,7 @@ echo "----------------------------------------------------------------"
 95  95   echo "Installing Gateway API CRDs v1.2.0..."
 96  96   kubectl apply -f https://github.com/kubernetes-sigs/gateway-api/releases/download/v1.2.0/standard-install.yaml
 97  97
 98     - # cert-manager: required for KubeRay webhooks
     98 + # cert-manager
 99  99   echo "Installing cert-manager..."
100 100   kubectl apply --server-side -f https://github.com/cert-manager/cert-manager/releases/download/v1.19.2/cert-manager.yaml
101 101

@@ -171,8 +171,17 @@ helm upgrade -i nvidia-dra-driver-gpu nvidia/nvidia-dra-driver-gpu \
171 171   --wait
172 172
173 173   # KubeRay
    174 + # Use the Helm chart; the kustomize "default-with-webhooks" overlay has incomplete RBAC
    175 + # (missing cluster-scope secrets permission), causing the operator to crash-loop.
    176 + # The Helm chart does not support webhooks, so we install without them.
174 177   echo "Installing KubeRay Operator..."
175     - kubectl apply --server-side -k "github.com/ray-project/kuberay/ray-operator/config/default-with-webhooks?ref=v1.5.0"
    178 + helm repo add kuberay https://ray-project.github.io/kuberay-helm/
    179 + helm repo update kuberay
    180 + helm upgrade -i kuberay-operator kuberay/kuberay-operator \
    181 + --version 1.5.0 \
    182 + --namespace ray-system \
    183 + --create-namespace \
    184 + --wait
176 185
177 186   # Kueue
178 187   echo "Installing Kueue..."
@@ -193,7 +202,7 @@ echo "Verifying Kueue..."
193 202   kubectl rollout status deployment -n kueue-system kueue-controller-manager --timeout=5m || echo "Warning: Kueue not ready yet"
194 203
195 204   echo "Verifying KubeRay..."
196     - kubectl rollout status deployment -n kuberay-system kuberay-operator --timeout=5m || echo "Warning: KubeRay not ready yet"
    205 + kubectl rollout status deployment -n ray-system kuberay-operator --timeout=5m || echo "Warning: KubeRay not ready yet"
197 206
198 207   echo "Verifying Gateway API..."
199 208   kubectl get gatewayclass || echo "Warning: GatewayClass not found"

0 commit comments

Comments
 (0)