Enable GPU scheduling for the text-classification backend pod.

Hunk 1 sets the pod's runtimeClassName to "nvidia".
Hunk 2 replaces the commented-out CPU/memory requests with GPU limits
(nvidia.com/gpu and nvidia.com/gpumem).

NOTE(review): nvidia.com/gpumem is presumably an extended resource exposed by
a GPU-sharing device plugin on the target cluster; confirm it exists there and
which unit "1000" is interpreted in.
NOTE(review): no cpu/memory requests or limits are visible in the resulting
resources block; confirm that is intended.
NOTE(review): leading whitespace below is reconstructed assuming 2-space
indentation with indented sequences; verify it against manifest.yaml (or use
`git apply --ignore-whitespace` for the context lines) before applying.

diff --git a/manifest.yaml b/manifest.yaml
index 7784f95..0535df7 100644
--- a/manifest.yaml
+++ b/manifest.yaml
@@ -27,6 +27,7 @@ spec:
         app: text-classification
         tier: backend
     spec:
+      runtimeClassName: "nvidia"
       volumes:
         - name: text-classification-models
           persistentVolumeClaim:
@@ -53,10 +54,10 @@ spec:
             - containerPort: 80
               protocol: TCP
               name: http
-          # resources:
-          #   requests:
-          #     cpu: 1000m
-          #     memory: 1024Mi
+          resources:
+            limits:
+              nvidia.com/gpu: "1"
+              nvidia.com/gpumem: "1000"
           volumeMounts:
             - mountPath: /app/models
               name: text-classification-models