1
0
Fork 0

assign extra NVIDIA GPU to ollama

This commit is contained in:
Massaki Archambault 2024-08-17 14:16:16 -04:00
parent 7060126ca7
commit 53b77ba489
3 changed files with 5 additions and 3 deletions

View File

@ -29,7 +29,6 @@ spec:
containers:
- name: server
image: ollama/ollama
# image: badjware/ollama-tweak
env:
- name: OLLAMA_KEEP_ALIVE
value: 36h
@ -44,7 +43,8 @@ spec:
limits:
memory: 4Gi
cpu: 3000m
nvidia.com/gpu: 1
nvidia.com/gpu: "2"
# amd.com/gpu: "1"
ports:
- name: http
hostPort: 11434

View File

@ -36,7 +36,8 @@ images:
- name: bitnami/kubectl
newTag: "1.29"
- name: ollama/ollama
newTag: 0.3.3
newTag: 0.3.6
# newTag: 0.3.6-rocm
- name: ghcr.io/berriai/litellm
newTag: main-v1.43.1
- name: ghcr.io/open-webui/open-webui

View File

@ -2,5 +2,6 @@ resources:
- ../../bases/longhorn
- ../../bases/traefik
- ../../bases/external-secrets
# - ../../bases/k8s-device-plugin-amd
- ../../bases/k8s-device-plugin-nvidia
- clustersecretstore.yaml