Skip to content

Commit a45eb9a

Browse files
Merge pull request #4927 from pmtk/rebase-ai-model_serving-2.20.0
USHIFT-5480: Rebase RHOAI to 2.20
2 parents 57ff22b + e9d7466 commit a45eb9a

File tree

10 files changed

+78
-39
lines changed

10 files changed

+78
-39
lines changed

assets/optional/ai-model-serving/kserve/inferenceservice-config-microshift-patch.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ data:
4040
"localGatewayService" : "kserve-local-gateway.istio-system.svc.cluster.local",
4141
"ingressDomain" : "example.com",
4242
"ingressClassName" : "istio",
43-
"domainTemplate": "{{ .Name }}-{{ .Namespace }}.{{ .IngressDomain }}",
43+
"domainTemplate": "example.com",
4444
"urlScheme": "https",
4545
"disableIstioVirtualHost": false,
4646
"disableIngressCreation": true

assets/optional/ai-model-serving/kserve/overlays/odh/inferenceservice-config-patch.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ data:
3232
"localGatewayService" : "kserve-local-gateway.istio-system.svc.cluster.local",
3333
"ingressDomain" : "example.com",
3434
"ingressClassName" : "istio",
35-
"domainTemplate": "{{ .Name }}-{{ .Namespace }}.{{ .IngressDomain }}",
35+
"domainTemplate": "example.com",
3636
"urlScheme": "https",
3737
"disableIstioVirtualHost": false,
3838
"disableIngressCreation": true
Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
kserve-controller=quay.io/modh/kserve-controller@sha256:62aa39acd23cd8097fc48b5b30fe35572efb46adc5d04e4215aadb77193e71df
2-
kserve-agent=quay.io/modh/kserve-agent@sha256:84d037d1ad3126f089298460a380041e2f819ce3af3ff21fc781bbf6b6ea81e3
3-
kserve-router=quay.io/modh/kserve-router@sha256:9def4776bc51cd2d78f4d6d57fd707a207616de4f7064c1f9a440af3f42ce741
4-
kserve-storage-initializer=quay.io/modh/kserve-storage-initializer@sha256:d361e822b8db152f431d7be48ad5afb6e459497e61441da9db961a63d5e7b242
5-
oauth-proxy=registry.redhat.io/openshift4/ose-oauth-proxy@sha256:bd49cfc8452b3d96467cc222db9487e120abc6cc5ba81349c6b3703706f36a08
1+
kserve-controller=quay.io/modh/kserve-controller@sha256:ebd5b4f7c816fc297055ecf44e80e81a20c5b289c64c37b5a55fad3c4c98d63a
2+
kserve-agent=quay.io/modh/kserve-agent@sha256:bc135bada2f5817cfbd111c868341bff3ab9e426f7b321fbb2deda1396bd7c4b
3+
kserve-router=quay.io/modh/kserve-router@sha256:324e2dab6be2cadbdcf137c9da67f9eb6fb1416b1ed77a5b06e2af181369b230
4+
kserve-storage-initializer=quay.io/modh/kserve-storage-initializer@sha256:baaa0a63ab0c8345da3fcb12eb35c58233e07cb2bb16772c6721c2ed26aad7fd
5+
oauth-proxy=registry.redhat.io/openshift4/ose-oauth-proxy@sha256:bd49cfc8452b3d96467cc222db9487e120abc6cc5ba81349c6b3703706f36a08

assets/optional/ai-model-serving/kserve/rbac/role.yaml

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -38,9 +38,17 @@ rules:
3838
- ""
3939
resources:
4040
- secrets
41+
verbs:
42+
- get
43+
- apiGroups:
44+
- ""
45+
resources:
4146
- serviceaccounts
4247
verbs:
48+
- create
49+
- delete
4350
- get
51+
- patch
4452
- apiGroups:
4553
- admissionregistration.k8s.io
4654
resources:
@@ -111,12 +119,24 @@ rules:
111119
- patch
112120
- update
113121
- watch
122+
- apiGroups:
123+
- rbac.authorization.k8s.io
124+
resourceNames:
125+
- kserve-inferencegraph-auth-verifiers
126+
resources:
127+
- clusterrolebindings
128+
verbs:
129+
- create
130+
- get
131+
- patch
132+
- update
114133
- apiGroups:
115134
- route.openshift.io
116135
resources:
117136
- routes
118137
verbs:
119138
- create
139+
- delete
120140
- get
121141
- list
122142
- patch
Lines changed: 13 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -1,20 +1,21 @@
11
{
22
"release": {
3-
"base": "2.19.0"
3+
"base": "2.20.0"
44
},
55
"images": {
6-
"caikit-tgis-image": "quay.io/modh/caikit-tgis-serving@sha256:2c7eef73708b5d73de33153459ac7238fdcf517cdc3544c775981f5814b4b6ed",
7-
"caikit-standalone-image": "quay.io/modh/caikit-nlp@sha256:ada8949b81e646809101edfc76738eb5aac362f783eb2facc8aeed21c7c1512f",
6+
"caikit-tgis-image": "quay.io/modh/caikit-tgis-serving@sha256:1d8a9fdd510020ed43ab19f333763257ca8bb1be9dcb330469baa7b110d8a6c8",
7+
"caikit-standalone-image": "quay.io/modh/caikit-nlp@sha256:7af5cfa5617723fc9039a01189e6e5e8d8d1d507cd015442588083a386618843",
88
"tgis-image": "quay.io/modh/text-generation-inference@sha256:aebf545d8048a59174f70334dc90c6b97ead4602a39cb7598ea68c8d199168a2",
9-
"ovms-image": "quay.io/modh/openvino_model_server@sha256:53b7fcf95de9b81e4c8652d0bf4e84e22d5b696827a5d951d863420c68b9cfe8",
10-
"vllm-cuda-image": "quay.io/modh/vllm@sha256:4f550996130e7d16cacb24ca9a2865e7cf51eddaab014ceaf31a1ea6ef86d4ec",
11-
"vllm-cpu-image": "quay.io/modh/vllm@sha256:881495befb6f807fa6e55f24e820fa67022b57d8ce0022305d89abe799c490fa",
12-
"vllm-gaudi-image": "quay.io/modh/vllm@sha256:af6a071be36d8a99476f145d1589d7ede97d2760b93335b14ca26de7417e438c",
13-
"vllm-rocm-image": "quay.io/modh/vllm@sha256:7e1d1985b0dd2b5ba2df41fc9c8c3edf13a2d9ed8a4d84db8f00eb6c753bc5c5",
14-
"kserve-controller": "quay.io/modh/kserve-controller@sha256:62aa39acd23cd8097fc48b5b30fe35572efb46adc5d04e4215aadb77193e71df",
15-
"kserve-agent": "quay.io/modh/kserve-agent@sha256:84d037d1ad3126f089298460a380041e2f819ce3af3ff21fc781bbf6b6ea81e3",
16-
"kserve-router": "quay.io/modh/kserve-router@sha256:9def4776bc51cd2d78f4d6d57fd707a207616de4f7064c1f9a440af3f42ce741",
17-
"kserve-storage-initializer": "quay.io/modh/kserve-storage-initializer@sha256:d361e822b8db152f431d7be48ad5afb6e459497e61441da9db961a63d5e7b242",
9+
"ovms-image": "quay.io/modh/openvino_model_server@sha256:428c00232cbf3b38a3929a0d22d0e13c6388ce353e3853cc2956d175eacf6724",
10+
"vllm-cuda-image": "quay.io/modh/vllm@sha256:e3e0f4ba3b78b53b3754bf63baf53bf22d9ec22fdc2974d4f2b5bdf8aeab276b",
11+
"ray-tls-generator-image": "registry.redhat.io/ubi9/ubi-minimal:latest",
12+
"vllm-cpu-image": "quay.io/modh/vllm@sha256:9e5f8f4394f599befb9e7f703e30581c4d7f062b8d4974992d6222837977ca5e",
13+
"vllm-gaudi-image": "quay.io/modh/vllm@sha256:e7cba648377c6fa29fab30481f97d96ccca76498aaf8bcf5162c74dfa4e0100c",
14+
"vllm-rocm-image": "quay.io/modh/vllm@sha256:de5d71c4fb6add81a01171bbabcd2e65fc2d75f0d6e57ca9ebcad9b4084db420",
15+
"kserve-controller": "quay.io/modh/kserve-controller@sha256:ebd5b4f7c816fc297055ecf44e80e81a20c5b289c64c37b5a55fad3c4c98d63a",
16+
"kserve-agent": "quay.io/modh/kserve-agent@sha256:bc135bada2f5817cfbd111c868341bff3ab9e426f7b321fbb2deda1396bd7c4b",
17+
"kserve-router": "quay.io/modh/kserve-router@sha256:324e2dab6be2cadbdcf137c9da67f9eb6fb1416b1ed77a5b06e2af181369b230",
18+
"kserve-storage-initializer": "quay.io/modh/kserve-storage-initializer@sha256:baaa0a63ab0c8345da3fcb12eb35c58233e07cb2bb16772c6721c2ed26aad7fd",
1819
"oauth-proxy": "registry.redhat.io/openshift4/ose-oauth-proxy@sha256:bd49cfc8452b3d96467cc222db9487e120abc6cc5ba81349c6b3703706f36a08"
1920
}
2021
}

assets/optional/ai-model-serving/runtimes/kustomization.x86_64.yaml

Lines changed: 10 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -2,25 +2,28 @@
22
images:
33
- name: caikit-tgis-image
44
newName: quay.io/modh/caikit-tgis-serving
5-
digest: sha256:2c7eef73708b5d73de33153459ac7238fdcf517cdc3544c775981f5814b4b6ed
5+
digest: sha256:1d8a9fdd510020ed43ab19f333763257ca8bb1be9dcb330469baa7b110d8a6c8
66
- name: caikit-standalone-image
77
newName: quay.io/modh/caikit-nlp
8-
digest: sha256:ada8949b81e646809101edfc76738eb5aac362f783eb2facc8aeed21c7c1512f
8+
digest: sha256:7af5cfa5617723fc9039a01189e6e5e8d8d1d507cd015442588083a386618843
99
- name: tgis-image
1010
newName: quay.io/modh/text-generation-inference
1111
digest: sha256:aebf545d8048a59174f70334dc90c6b97ead4602a39cb7598ea68c8d199168a2
1212
- name: ovms-image
1313
newName: quay.io/modh/openvino_model_server
14-
digest: sha256:53b7fcf95de9b81e4c8652d0bf4e84e22d5b696827a5d951d863420c68b9cfe8
14+
digest: sha256:428c00232cbf3b38a3929a0d22d0e13c6388ce353e3853cc2956d175eacf6724
1515
- name: vllm-cuda-image
1616
newName: quay.io/modh/vllm
17-
digest: sha256:4f550996130e7d16cacb24ca9a2865e7cf51eddaab014ceaf31a1ea6ef86d4ec
17+
digest: sha256:e3e0f4ba3b78b53b3754bf63baf53bf22d9ec22fdc2974d4f2b5bdf8aeab276b
18+
- name: ray-tls-generator-image
19+
newName: registry.redhat.io/ubi9/ubi-minimal:latest
20+
digest: registry.redhat.io/ubi9/ubi-minimal:latest
1821
- name: vllm-cpu-image
1922
newName: quay.io/modh/vllm
20-
digest: sha256:881495befb6f807fa6e55f24e820fa67022b57d8ce0022305d89abe799c490fa
23+
digest: sha256:9e5f8f4394f599befb9e7f703e30581c4d7f062b8d4974992d6222837977ca5e
2124
- name: vllm-gaudi-image
2225
newName: quay.io/modh/vllm
23-
digest: sha256:af6a071be36d8a99476f145d1589d7ede97d2760b93335b14ca26de7417e438c
26+
digest: sha256:e7cba648377c6fa29fab30481f97d96ccca76498aaf8bcf5162c74dfa4e0100c
2427
- name: vllm-rocm-image
2528
newName: quay.io/modh/vllm
26-
digest: sha256:7e1d1985b0dd2b5ba2df41fc9c8c3edf13a2d9ed8a4d84db8f00eb6c753bc5c5
29+
digest: sha256:de5d71c4fb6add81a01171bbabcd2e65fc2d75f0d6e57ca9ebcad9b4084db420

scripts/auto-rebase/last_rebase_ai_model_serving.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
#!/bin/bash -x
2-
./scripts/auto-rebase/rebase_ai_model_serving.sh to "registry.redhat.io/rhoai/odh-operator-bundle:v2.19"
2+
./scripts/auto-rebase/rebase_ai_model_serving.sh to "registry.redhat.io/rhoai/odh-operator-bundle:v2.20"

scripts/auto-rebase/rebase_ai_model_serving.sh

Lines changed: 12 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -198,6 +198,15 @@ EOF
198198
chmod +x "${last_rebase_script}"
199199
}
200200

201+
update_rebase_job_entrypoint_sh() {
202+
local -r operator_bundle="${1}"
203+
204+
title "Updating rebase_job_entrypoint.sh"
205+
sed -i \
206+
"s,^rhoai_release=.*\$,rhoai_release=\"${operator_bundle}\",g" \
207+
"${REPOROOT}/scripts/auto-rebase/rebase_job_entrypoint.sh"
208+
}
209+
201210
rebase_ai_model_serving_to() {
202211
local -r operator_bundle="${1}"
203212

@@ -207,10 +216,11 @@ rebase_ai_model_serving_to() {
207216
local -r version=$(get_rhoai_bundle_version)
208217

209218
update_last_rebase_ai_model_serving_sh "${operator_bundle}"
219+
update_rebase_job_entrypoint_sh "${operator_bundle}"
210220

211221
process_rhoai_manifests
212222

213-
if [[ -n "$(git status -s assets ./scripts/auto-rebase/last_rebase_ai_model_serving.sh)" ]]; then
223+
if [[ -n "$(git status -s ./assets ./scripts/auto-rebase/rebase_job_entrypoint.sh ./scripts/auto-rebase/last_rebase_ai_model_serving.sh)" ]]; then
214224
title "Detected changes to assets/ or last_rebase_ai_model_serving.sh"
215225

216226
if ! "${NO_BRANCH}"; then
@@ -220,7 +230,7 @@ rebase_ai_model_serving_to() {
220230
fi
221231

222232
title "Committing changes"
223-
git add assets ./scripts/auto-rebase/last_rebase_ai_model_serving.sh
233+
git add ./assets ./scripts/auto-rebase/rebase_job_entrypoint.sh ./scripts/auto-rebase/last_rebase_ai_model_serving.sh
224234
git commit -m "Update AI Model Serving for MicroShift"
225235
else
226236
title "No changes to assets/ or last_rebase_ai_model_serving.sh"

scripts/auto-rebase/rebase_job_entrypoint.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -75,7 +75,7 @@ pullspec_release_arm64="registry.ci.openshift.org/ocp-arm64/release-arm64:${rele
7575
#
7676
# New references can be obtained from:
7777
# https://catalog.redhat.com/software/containers/rhoai/odh-operator-bundle/659803ca929f3c931af06f28
78-
rhoai_release="registry.redhat.io/rhoai/odh-operator-bundle:v2.19"
78+
rhoai_release="registry.redhat.io/rhoai/odh-operator-bundle:v2.20"
7979

8080
APP_ID=$(cat /secrets/pr-creds/app_id) \
8181
KEY=/secrets/pr-creds/key.pem \

test/suites/ai-model-serving/ai-model-serving-offline.robot

Lines changed: 14 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -19,22 +19,27 @@ ${IP}= 10.44.0.1
1919
Sanity Test
2020
[Documentation] Sanity test for AI Model Serving
2121
22-
# Warning: Next keyword will fail if the VM was rebooted.
23-
# See https://github.com/kserve/kserve/pull/4274
24-
# After the issue is fixed and backported: add reboot and retest
25-
Wait For A Deployment test-ai openvino-resnet-predictor
26-
Wait Until Keyword Succeeds 10x 10s
27-
... Check If Model Is Ready
28-
Query Model Metrics
29-
Prepare Request Data
30-
Query Model Server
22+
Model Serving Offline Test
3123

3224
# Check if ingress exists.
3325
# Enabled only for testing purposes to test Kserve's settings override.
3426
offline.Run With Kubeconfig oc get ingress -n test-ai openvino-resnet
3527

28+
offline.Reboot MicroShift Host
29+
offline.Wait For Greenboot Health Check To Exit
30+
Model Serving Offline Test
31+
3632

3733
*** Keywords ***
34+
Model Serving Offline Test
35+
[Documentation] Waits for the model server and queries it
36+
Wait For A Deployment test-ai openvino-resnet-predictor
37+
Wait Until Keyword Succeeds 10x 10s
38+
... Check If Model Is Ready
39+
Query Model Metrics
40+
Prepare Request Data
41+
Query Model Server
42+
3843
Wait For A Deployment
3944
[Documentation] Wait for a deployment on offline VM
4045
[Arguments] ${namespace} ${name}

0 commit comments

Comments
 (0)