---
# Deployment for the `server` component: one pod running a single
# `kokoro-tts` container from the Kokoro FastAPI GPU image.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: server
  labels:
    app.kubernetes.io/component: server
spec:
  replicas: 1
  # Recreate terminates the existing pod before the replacement is created.
  # NOTE(review): presumably chosen so the old and new pods never compete
  # for the same GPU during a rollout - confirm.
  strategy:
    type: Recreate
  # Must match the pod template labels below.
  selector:
    matchLabels:
      app.kubernetes.io/component: server
  template:
    metadata:
      labels:
        app.kubernetes.io/component: server
    spec:
      affinity:
        nodeAffinity:
          # Hard scheduling requirement: only evaluated when the pod is
          # scheduled, not re-checked while it is running.
          requiredDuringSchedulingIgnoredDuringExecution:
            nodeSelectorTerms:
              - matchExpressions:
                  # Image only supports amd64
                  - key: kubernetes.io/arch
                    operator: In
                    values:
                      - amd64
      # Runs the pod under the RuntimeClass named `nvidia`, which has to be
      # defined in the target cluster.
      runtimeClassName: nvidia
      containers:
        - name: kokoro-tts
          image: ghcr.io/remsky/kokoro-fastapi-gpu:v0.1.4
          resources:
            requests:
              cpu: 500m
              memory: 1.5Gi
            limits:
              cpu: 1000m
              memory: 2Gi
              # Extended resources such as GPUs are declared under limits;
              # Kubernetes uses the same value as the request.
              nvidia.com/gpu: "1"