Add OVMS OOTB with GPU support (#1262)

* Add OpenVINO with GPU support
* Update display name of GPU
* Use one image for both OOTB
opendatahub-io · May 19, 2023 · 5d92707 · shalberd · Jun 3, 2023 · lucferbux
1 parent 40cd8a4
commit 5d92707
Show file tree

Hide file tree

Showing 3 changed files with 66 additions and 4 deletions.
diff --git a/manifests/modelserving/kustomization.yaml b/manifests/modelserving/kustomization.yaml
@@ -4,8 +4,9 @@ commonLabels:
   app: odh-dashboard
   app.kubernetes.io/part-of: odh-dashboard
 resources:
-  -  servingruntimes-template.yaml
+  - ovms-ootb.yaml  # 'OpenVINO Model Server' template (renamed from servingruntimes-template.yaml)
+  - ovms-gpu-ootb.yaml  # 'OpenVINO Model Server (Supports GPUs)' template
 images:
-- name: ovms-1
-  newName: quay.io/opendatahub/openvino_model_server
-  digest: sha256:20dbfbaf53d1afbd47c612d953984238cb0e207972ed544a5ea662c2404f276d
+  - name: ovms-1  # image name used by the ovms container in ovms-gpu-ootb.yaml
+    newName: quay.io/opendatahub/openvino_model_server
+    digest: sha256:20dbfbaf53d1afbd47c612d953984238cb0e207972ed544a5ea662c2404f276d
diff --git a/manifests/modelserving/ovms-gpu-ootb.yaml b/manifests/modelserving/ovms-gpu-ootb.yaml
@@ -0,0 +1,60 @@
+kind: Template  # OpenShift Template wrapping the GPU-enabled OVMS ServingRuntime defined under objects
+apiVersion: template.openshift.io/v1
+metadata:
+  name: ovms-gpu
+  labels:
+    opendatahub.io/dashboard: 'true'
+    opendatahub.io/ootb: 'true'  # NOTE(review): presumably marks an out-of-the-box template; confirm with the dashboard
+    opendatahub.io/configurable: 'true'
+  annotations:
+    tags: 'ovms,servingruntime'
+    description: 'OpenVino with GPU Support Model Serving Definition'
+objects:
+  - apiVersion: serving.kserve.io/v1alpha1
+    kind: ServingRuntime
+    metadata:
+      name: ovms-gpu
+      annotations:
+        openshift.io/display-name: 'OpenVINO Model Server (Supports GPUs)'
+      labels:
+        opendatahub.io/dashboard: 'true'
+    spec:
+      builtInAdapter:
+        env:
+          - name: OVMS_FORCE_TARGET_DEVICE  # presumably selects the NVIDIA device for loaded models; verify against the adapter docs
+            value: NVIDIA
+        memBufferBytes: 134217728  # 128 MiB
+        modelLoadingTimeoutMillis: 90000  # 90 seconds
+        runtimeManagementPort: 8888  # same port as --rest_port in the container args
+        serverType: ovms
+      containers:
+        - args:
+            - '--port=8001'  # gRPC port; same port as grpcDataEndpoint
+            - '--rest_port=8888'
+            - '--config_path=/models/model_config_list.json'
+            - '--file_system_poll_wait_seconds=0'
+            - '--grpc_bind_address=127.0.0.1'  # gRPC and REST both bind to loopback only
+            - '--rest_bind_address=127.0.0.1'
+          image: ovms-1  # image name; kustomization.yaml's images entry for ovms-1 sets the registry path and digest
+          name: ovms
+          resources:  # NOTE(review): all-zero requests/limits look like placeholders; confirm they are overridden
+            limits:
+              cpu: '0'
+              memory: 0Gi
+            requests:
+              cpu: '0'
+              memory: 0Gi
+      grpcDataEndpoint: 'port:8001'  # same port as --port in the container args
+      grpcEndpoint: 'port:8085'
+      multiModel: true
+      protocolVersions:
+        - grpc-v1
+      replicas: 1
+      supportedModelFormats:
+        - autoSelect: true
+          name: openvino_ir
+          version: opset1
+        - autoSelect: true
+          name: onnx
+          version: '1'
+parameters: []  # this template declares no parameters
diff --git a/manifests/modelserving/servingruntimes-template.yaml b/manifests/modelserving/ovms-ootb.yaml
@@ -16,6 +16,7 @@ objects:
       name: ovms
       annotations:
         openshift.io/display-name: 'OpenVINO Model Server'
+        opendatahub.io/disable-gpu: 'true'
       labels:
         opendatahub.io/dashboard: 'true'
     spec: