Skip to content

Commit 9f21ac6

Browse files
authored
Deploy Kueue configured with AppWrapper as an externalFramework (#172)
1 parent edc2ba1 commit 9f21ac6

File tree

3 files changed

+47
-1
lines changed

3 files changed

+47
-1
lines changed

hack/deploy-kueue.sh

+8 -1
Original file line number | Diff line number | Diff line change
@@ -18,8 +18,15 @@ KUEUE_VERSION=v0.7.0
1818

1919
export ROOT_DIR="$(dirname "$(dirname "$(readlink -fn "$0")")")"
2020

21+
echo "Downloading and patching Kueue ${KUEUE_VERSION} manifests"
22+
wget -q https://github.com/kubernetes-sigs/kueue/releases/download/${KUEUE_VERSION}/manifests.yaml -O $ROOT_DIR/hack/kueue-manifest.yaml
23+
patch -p 0 $ROOT_DIR/hack/kueue-manifest.yaml < $ROOT_DIR/hack/kueue-patches/01-manage-all-jobs.txt || exit 1
24+
patch -p 0 $ROOT_DIR/hack/kueue-manifest.yaml < $ROOT_DIR/hack/kueue-patches/02-aw-external-frameworks.txt || exit 1
25+
2126
echo "Deploying Kueue version $KUEUE_VERSION"
22-
kubectl apply --server-side -f https://github.com/kubernetes-sigs/kueue/releases/download/${KUEUE_VERSION}/manifests.yaml
27+
kubectl apply --server-side -f $ROOT_DIR/hack/kueue-manifest.yaml
28+
29+
rm -f $ROOT_DIR/hack/kueue-manifest.yaml
2330

2431
# Sleep until the kueue manager is running
2532
echo "Waiting for pods in the kueue-system namespace to become ready"
+11
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,11 @@
1+
--- manifests.yaml 2024-06-26 13:58:48.132795505 -0400
2+
+++ manifests.yaml 2024-06-26 13:59:54.945553273 -0400
3+
@@ -11878,7 +11878,7 @@
4+
# backoffLimitCount: null # null indicates infinite requeuing
5+
# backoffBaseSeconds: 60
6+
# backoffMaxSeconds: 3600
7+
- #manageJobsWithoutQueueName: true
8+
+ manageJobsWithoutQueueName: true
9+
#internalCertManagement:
10+
# enable: false
11+
# webhookServiceName: ""
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,28 @@
1+
--- manifests.yaml 2024-06-26 13:59:54.945553273 -0400
2+
+++ manifests.yaml 2024-06-26 14:02:25.889855296 -0400
3+
@@ -11225,6 +11225,14 @@
4+
- get
5+
- list
6+
- watch
7+
+- apiGroups:
8+
+ - workload.codeflare.dev
9+
+ resources:
10+
+ - appwrappers
11+
+ verbs:
12+
+ - get
13+
+ - list
14+
+ - watch
15+
---
16+
apiVersion: rbac.authorization.k8s.io/v1
17+
kind: ClusterRole
18+
@@ -11896,8 +11904,8 @@
19+
- "kubeflow.org/tfjob"
20+
- "kubeflow.org/xgboostjob"
21+
# - "pod"
22+
- # externalFrameworks:
23+
- # - "Foo.v1.example.com"
24+
+ externalFrameworks:
25+
+ - "AppWrapper.v1beta2.workload.codeflare.dev"
26+
# podOptions:
27+
# namespaceSelector:
28+
# matchExpressions:

0 commit comments

Comments
 (0)