Bump Ollama version and enforce the Recreate strategy due to GPU limitations
This commit is contained in:
parent
c3e6921ad6
commit
348328f17c
2 changed files with 8 additions and 1 deletions
|
@ -1,6 +1,11 @@
|
|||
apiVersion: kustomize.config.k8s.io/v1beta1
|
||||
kind: Kustomization
|
||||
|
||||
images:
|
||||
- name: image
|
||||
newName: ollama/ollama
|
||||
newTag: 0.11.3
|
||||
|
||||
transformers:
|
||||
- |-
|
||||
apiVersion: builtin
|
||||
|
|
|
@ -3,6 +3,8 @@ kind: Deployment
|
|||
metadata:
|
||||
name: app
|
||||
spec:
|
||||
strategy:
|
||||
type: Recreate  # Needed since there is only 1 GPU: the old pod must be stopped before the new one is created
|
||||
template:
|
||||
spec:
|
||||
runtimeClassName: nvidia
|
||||
|
@ -13,7 +15,7 @@ spec:
|
|||
effect: "NoSchedule"
|
||||
containers:
|
||||
- name: ollama
|
||||
image: ollama/ollama:0.6.7
|
||||
image: image
|
||||
imagePullPolicy: IfNotPresent
|
||||
resources:
|
||||
limits:
|
||||
|
|
Loading…
Add table
Reference in a new issue