---
# Deployment fragment for the workload named "app" that runs a single
# "ollama" container on a GPU node.
# NOTE(review): no replicas, selector, or pod labels appear here — presumably
# this is a partial manifest/overlay patch merged onto a base; confirm.
# NOTE(review): nesting was reconstructed from the Kubernetes Deployment
# schema because the original indentation was not preserved — verify against
# the authoritative copy.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: app
spec:
  template:
    spec:
      # Run the pod under the RuntimeClass named "nvidia".
      runtimeClassName: nvidia
      # Allow scheduling onto nodes tainted gpu=true:NoSchedule.
      tolerations:
        - key: "gpu"
          operator: "Equal"
          # Quoted on purpose: taint values are strings, not booleans.
          value: "true"
          effect: "NoSchedule"
      containers:
        - name: ollama
          image: ollama/ollama:0.6.4
          imagePullPolicy: IfNotPresent
          resources:
            limits:
              # Extended resource: one NVIDIA GPU for this container.
              nvidia.com/gpu: 1
          ports:
            # Named port; the probes below refer to it by this name.
            - name: ollama
              containerPort: 11434
              protocol: TCP
          volumeMounts:
            # Backed by the "ollama-data" volume declared under `volumes`.
            - mountPath: /root/.ollama
              name: ollama-data
          # Both probes issue HTTP GET / against the named "ollama" port.
          livenessProbe:
            httpGet:
              path: /
              port: ollama
          readinessProbe:
            httpGet:
              path: /
              port: ollama

      volumes:
        # Persistent storage supplied by the existing claim "ollama-pvc".
        - name: ollama-data
          persistentVolumeClaim:
            claimName: ollama-pvc