Skip to content

Commit

Permalink
Add openvino with GPU support
Browse files Browse the repository at this point in the history
  • Loading branch information
lucferbux committed May 19, 2023
1 parent 0d3144a commit 89ede09
Show file tree
Hide file tree
Showing 3 changed files with 69 additions and 4 deletions.
12 changes: 8 additions & 4 deletions manifests/modelserving/kustomization.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,12 @@ commonLabels:
app: odh-dashboard
app.kubernetes.io/part-of: odh-dashboard
resources:
- servingruntimes-template.yaml
- ovms-ootb.yaml
- ovms-gpu-ootb.yaml
images:
- name: ovms-1
newName: quay.io/opendatahub/openvino_model_server
digest: sha256:20dbfbaf53d1afbd47c612d953984238cb0e207972ed544a5ea662c2404f276d
- name: ovms-1
newName: quay.io/opendatahub/openvino_model_server
digest: sha256:20dbfbaf53d1afbd47c612d953984238cb0e207972ed544a5ea662c2404f276d
- name: ovms-gpu-1
newName: quay.io/modh/openvino-model-server
digest: sha256:c89f76386bc8b59f0748cf173868e5beef21ac7d2f78dada69089c4d37c44116
60 changes: 60 additions & 0 deletions manifests/modelserving/ovms-gpu-ootb.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,60 @@
# OpenShift Template that wraps a single ServingRuntime object named
# `ovms-gpu` (OpenVINO Model Server with GPU support).
kind: Template
apiVersion: template.openshift.io/v1
metadata:
  name: ovms-gpu
  labels:
    # Label values are quoted so they stay strings rather than YAML booleans.
    # NOTE(review): presumably these labels are how the ODH dashboard
    # discovers out-of-the-box, configurable runtimes - confirm with the
    # dashboard code.
    opendatahub.io/dashboard: 'true'
    opendatahub.io/ootb: 'true'
    opendatahub.io/configurable: 'true'
  annotations:
    tags: 'ovms,servingruntime'
    description: 'OpenVino with GPU Support Model Serving Definition'
objects:
  - apiVersion: serving.kserve.io/v1alpha1
    kind: ServingRuntime
    metadata:
      name: ovms-gpu
      annotations:
        openshift.io/display-name: 'OpenVINO Model Server [GPU]'
      labels:
        opendatahub.io/dashboard: 'true'
    spec:
      builtInAdapter:
        env:
          # NOTE(review): presumably makes the adapter load models onto the
          # NVIDIA device instead of the default one - confirm against the
          # adapter documentation.
          - name: OVMS_FORCE_TARGET_DEVICE
            value: NVIDIA
        memBufferBytes: 134217728 # 128 MiB
        modelLoadingTimeoutMillis: 90000 # 90 seconds
        # Same port as the container's `--rest_port` argument below.
        runtimeManagementPort: 8888
        serverType: ovms
      containers:
        - args:
            - '--port=8001'
            - '--rest_port=8888'
            - '--config_path=/models/model_config_list.json'
            - '--file_system_poll_wait_seconds=0'
            # Both listeners are bound to the loopback address only.
            - '--grpc_bind_address=127.0.0.1'
            - '--rest_bind_address=127.0.0.1'
          # Placeholder image name, not a pullable reference; expected to be
          # rewritten by a kustomize `images` entry with the same name.
          image: ovms-gpu-1
          name: ovms
          # NOTE(review): zero-valued limits/requests look like placeholders
          # that are overridden at deployment time - confirm.
          resources:
            limits:
              cpu: '0'
              memory: 0Gi
            requests:
              cpu: '0'
              memory: 0Gi
      # Same port as the container's `--port` argument above.
      grpcDataEndpoint: 'port:8001'
      grpcEndpoint: 'port:8085'
      multiModel: true
      protocolVersions:
        - grpc-v1
      replicas: 1
      supportedModelFormats:
        - autoSelect: true
          name: openvino_ir
          version: opset1
        - autoSelect: true
          name: onnx
          # Quoted so the version stays a string, not an integer.
          version: '1'
# The template declares no parameters.
parameters: []
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ metadata:
opendatahub.io/dashboard: 'true'
opendatahub.io/ootb: 'true'
opendatahub.io/configurable: 'true'
opendatahub.io/disable-gpu: 'true'
annotations:
tags: 'ovms,servingruntime'
description: 'OpenVino Model Serving Definition'
Expand Down

0 comments on commit 89ede09

Please sign in to comment.