From c0d5bfcb5e9cae881f45f7bf734571960d4aa443 Mon Sep 17 00:00:00 2001 From: bdattoma Date: Fri, 13 Dec 2024 16:14:54 +0100 Subject: [PATCH] install AMD GPU certified operator --- .../Provisioning/GPU/AMD/amd_gpu_install.yaml | 10 ++--- .../Provisioning/GPU/AMD/amd_operator.sh | 38 ++++++++++++------- .../GPU/AMD/blacklist_driver.yaml | 2 +- 3 files changed, 31 insertions(+), 19 deletions(-) diff --git a/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_gpu_install.yaml b/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_gpu_install.yaml index e98c3ece4..b18a1a736 100644 --- a/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_gpu_install.yaml +++ b/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_gpu_install.yaml @@ -1,15 +1,15 @@ apiVersion: v1 kind: Namespace metadata: - name: openshift-amd-gpu + name: kube-amd-gpu --- apiVersion: operators.coreos.com/v1 kind: OperatorGroup metadata: - name: openshift-amd-gpu-operator-group - namespace: openshift-amd-gpu + name: kube-amd-gpu-operator-group + namespace: kube-amd-gpu spec: {} --- @@ -18,11 +18,11 @@ apiVersion: operators.coreos.com/v1alpha1 kind: Subscription metadata: name: amd-gpu-operator - namespace: openshift-amd-gpu + namespace: kube-amd-gpu spec: channel: alpha installPlanApproval: Automatic name: amd-gpu-operator - source: community-operators + source: certified-operators sourceNamespace: openshift-marketplace diff --git a/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_operator.sh b/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_operator.sh index 1f5c2e95c..416abc582 100755 --- a/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_operator.sh +++ b/ods_ci/tasks/Resources/Provisioning/GPU/AMD/amd_operator.sh @@ -2,6 +2,8 @@ set -e GPU_INSTALL_DIR="$(dirname "$0")" +AMD_DC_NS="kube-amd-gpu" +ROCM_VERSION="6.2.2" function create_registry_network() { oc patch configs.imageregistry.operator.openshift.io cluster --type merge --patch '{"spec":{"storage":{"emptyDir":{}}}}' @@ -57,18 +59,28 @@ has_csv_succeeded() { function create_devconfig() { dc_name="dc-internal-registry" - dc=$(oc get DeviceConfig $dc_name -n openshift-amd-gpu -oname --ignore-not-found) + dc=$(oc get DeviceConfig $dc_name -n $AMD_DC_NS -oname --ignore-not-found) if [[ -n $dc ]]; then echo "AMD DeviceConfig $dc_name already exists". Skipping creation else echo "Creating AMD DeviceConfig..." oc create -f - <