---
# Deployment running the LiteLLM container, configured from the
# `litellm-config` ConfigMap mounted at /config.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: litellm
spec:
  selector:
    matchLabels:
      app.kubernetes.io/component: litellm
  template:
    metadata:
      labels:
        # Must match spec.selector.matchLabels above and the Service selector.
        app.kubernetes.io/component: litellm
    spec:
      affinity:
        nodeAffinity:
          requiredDuringSchedulingIgnoredDuringExecution:
            nodeSelectorTerms:
              - matchExpressions:
                  # Image only supports amd64
                  - key: kubernetes.io/arch
                    operator: In
                    values:
                      - amd64
      containers:
        - name: litellm
          image: ghcr.io/berriai/litellm:main-latest
          # `args` replaces the image's default CMD, so the listen port is
          # passed explicitly to keep it in step with `containerPort` below.
          # NOTE(review): the image's built-in default port may differ from
          # 8000 depending on the release behind `main-latest` - confirm.
          args: ['--config', '/config/config.yml', '--port', '8000']
          resources:
            # Requests and limits are intentionally identical.
            requests:
              memory: 200Mi
              cpu: 200m
            limits:
              memory: 200Mi
              cpu: 200m
          ports:
            # Named port; the Service refers to it as `targetPort: http`.
            - containerPort: 8000
              name: http
          volumeMounts:
            # Exposes the ConfigMap contents under /config, where `--config`
            # expects to find config.yml.
            - name: litellm-config
              mountPath: /config
      volumes:
        - name: litellm-config
          configMap:
            name: litellm-config
---
# Service exposing the litellm pods on port 8000.
apiVersion: v1
kind: Service
metadata:
  name: litellm
  labels:
    app.kubernetes.io/component: litellm
spec:
  selector:
    app.kubernetes.io/component: litellm
  ports:
    - name: http
      port: 8000
      # Resolves to the container port named `http` in the Deployment.
      targetPort: http