Bump Ollama to 0.11.3 and enforce the Recreate deployment strategy because only one GPU is available

This commit is contained in:
JLP 2025-08-07 13:34:23 -04:00
parent c3e6921ad6
commit 348328f17c
Signed by: jleechpe
GPG key ID: 414E00D1FF7519DC
2 changed files with 8 additions and 1 deletion

View file

@@ -1,6 +1,11 @@
apiVersion: kustomize.config.k8s.io/v1beta1 apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization kind: Kustomization
images:
- name: image
newName: ollama/ollama
newTag: 0.11.3
transformers: transformers:
- |- - |-
apiVersion: builtin apiVersion: builtin

View file

@@ -3,6 +3,8 @@ kind: Deployment
metadata: metadata:
name: app name: app
spec: spec:
strategy:
type: Recreate # Needed since only 1 GPU
template: template:
spec: spec:
runtimeClassName: nvidia runtimeClassName: nvidia
@@ -13,7 +15,7 @@ spec:
effect: "NoSchedule" effect: "NoSchedule"
containers: containers:
- name: ollama - name: ollama
- image: ollama/ollama:0.6.7
+ image: image
imagePullPolicy: IfNotPresent imagePullPolicy: IfNotPresent
resources: resources:
limits: limits: