---
# Deployment "server": runs a single kokoro-tts container on an amd64 node,
# using the "nvidia" RuntimeClass and requesting one nvidia.com/gpu device.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: server
  labels:
    app.kubernetes.io/component: server
spec:
  replicas: 1
  # Recreate terminates the existing pod before the replacement is created.
  # NOTE(review): presumably chosen so the old and new pod never compete for
  # the same GPU during a rollout -- confirm.
  strategy:
    type: Recreate
  # Must match the pod template labels below.
  selector:
    matchLabels:
      app.kubernetes.io/component: server
  template:
    metadata:
      labels:
        app.kubernetes.io/component: server
    spec:
      affinity:
        nodeAffinity:
          # Hard scheduling requirement: evaluated when the pod is scheduled,
          # not re-evaluated for pods that are already running.
          requiredDuringSchedulingIgnoredDuringExecution:
            nodeSelectorTerms:
              - matchExpressions:
                  # Image only supports amd64
                  - key: kubernetes.io/arch
                    operator: In
                    values:
                      - amd64
      # References a RuntimeClass object named "nvidia"; it must exist in the
      # cluster (presumably backed by the NVIDIA container runtime -- confirm).
      runtimeClassName: nvidia
      containers:
        - name: kokoro-tts
          image: ghcr.io/remsky/kokoro-fastapi-gpu:v0.1.4
          resources:
            requests:
              cpu: 500m
              memory: 1.5Gi
            limits:
              cpu: 1000m
              memory: 2Gi
              # Extended resource: set under limits only; Kubernetes uses the
              # limit as the request when no request is given. Quoted so the
              # quantity is passed as a string.
              nvidia.com/gpu: "1"