This commit is contained in:
ivamp 2024-11-06 02:03:15 +08:00
parent 69067d948f
commit d49f0c1fb3

View File

@@ -27,6 +27,7 @@ spec:
app: text-classification
tier: backend
spec:
runtimeClassName: "nvidia"
volumes:
- name: text-classification-models
persistentVolumeClaim:
@@ -53,10 +54,10 @@ spec:
- containerPort: 80
protocol: TCP
name: http
# resources:
# requests:
# cpu: 1000m
# memory: 1024Mi
# Resource limits: one nvidia.com/gpu plus 1000 of nvidia.com/gpumem.
# Only limits are declared in this block; no requests are given.
resources:
limits:
nvidia.com/gpu: "1"
# NOTE(review): nvidia.com/gpumem does not look like a resource advertised by
# the stock NVIDIA device plugin; presumably it comes from a GPU-sharing layer
# (e.g. HAMi) and is counted in MiB. Confirm the provider and the unit.
nvidia.com/gpumem: "1000"
volumeMounts:
- mountPath: /app/models
name: text-classification-models