---
# KServe ClusterServingRuntime for the NVIDIA NIM "nvclip" container image.
apiVersion: serving.kserve.io/v1alpha1
kind: ClusterServingRuntime
metadata:
  name: nvidia-nim-nvclip
  # NOTE(review): the kind name suggests a cluster-scoped resource, in which
  # case this namespace would have no effect - confirm and drop if unneeded.
  namespace: default
spec:
  containers:
    - env:
        - name: NIM_CACHE_PATH
          value: /tmp
        # The NGC API key is injected from a Secret rather than stored inline.
        - name: NGC_API_KEY
          valueFrom:
            secretKeyRef:
              name: nvidia-nim-secrets
              key: NGC_API_KEY
      # NOTE(review): ":latest" is a floating tag; consider pinning a specific
      # version or digest so rollouts are reproducible.
      image: upmdev.azurecr.io/nim/nvidia/nvclip:latest
      name: kserve-container
      ports:
        - containerPort: 8000
          protocol: TCP
      # Requests equal limits for both cpu and memory.
      # NOTE(review): no accelerator (GPU) resource is requested here -
      # confirm that is intended for this runtime.
      resources:
        limits:
          cpu: "8"
          memory: 24Gi
        requests:
          cpu: "8"
          memory: 24Gi
      volumeMounts:
        - mountPath: /dev/shm
          name: dshm
  imagePullSecrets:
    - name: edb-cred
  protocolVersions:
    - v2
    - grpc-v2
  supportedModelFormats:
    - autoSelect: true
      name: nvidia-nim-nvclip
      priority: 1
      # Quoted so the value is always read as a string.
      version: "latest"
  volumes:
    # Memory-backed scratch volume mounted into the container at /dev/shm.
    # NOTE(review): memory-medium emptyDir usage presumably counts toward the
    # container's 24Gi memory limit; verify 20Gi leaves enough headroom.
    - emptyDir:
        medium: Memory
        sizeLimit: 20Gi
      name: dshm