Files
infrastructure/clusters/cl01tl/platform/ollama/values.yaml
Renovate Bot 34d6b073d6
Some checks failed
renovate/stability-days Updates have met minimum release age requirement
lint-test-helm / helm-lint (pull_request) Successful in 11s
lint-test-helm / helm-lint (push) Has been cancelled
renovate / renovate (push) Has been cancelled
Update ollama/ollama Docker tag to v0.9.4
2025-07-02 16:01:38 +00:00

264 lines
7.2 KiB
YAML

ollama:
controllers:
server-1:
type: deployment
replicas: 1
strategy: Recreate
revisionHistoryLimit: 3
pod:
labels:
ollama-type: server
affinity:
podAntiAffinity:
requiredDuringSchedulingIgnoredDuringExecution:
- labelSelector:
matchExpressions:
- key: ollama-type
operator: In
values:
- server
topologyKey: kubernetes.io/hostname
containers:
main:
image:
repository: ollama/ollama
tag: 0.9.4
pullPolicy: IfNotPresent
env:
- name: OLLAMA_KEEP_ALIVE
value: 24h
- name: OLLAMA_HOST
value: 0.0.0.0
resources:
limits:
gpu.intel.com/i915: 1
requests:
cpu: 100m
memory: 1Gi
gpu.intel.com/i915: 1
server-2:
type: deployment
replicas: 1
strategy: Recreate
revisionHistoryLimit: 3
pod:
labels:
ollama-type: server
affinity:
podAntiAffinity:
requiredDuringSchedulingIgnoredDuringExecution:
- labelSelector:
matchExpressions:
- key: ollama-type
operator: In
values:
- server
topologyKey: kubernetes.io/hostname
containers:
main:
image:
repository: ollama/ollama
tag: 0.9.4
pullPolicy: IfNotPresent
env:
- name: OLLAMA_KEEP_ALIVE
value: 24h
- name: OLLAMA_HOST
value: 0.0.0.0
resources:
limits:
gpu.intel.com/i915: 1
requests:
cpu: 100m
memory: 1Gi
gpu.intel.com/i915: 1
server-3:
type: deployment
replicas: 1
strategy: Recreate
revisionHistoryLimit: 3
pod:
labels:
ollama-type: server
affinity:
podAntiAffinity:
requiredDuringSchedulingIgnoredDuringExecution:
- labelSelector:
matchExpressions:
- key: ollama-type
operator: In
values:
- server
topologyKey: kubernetes.io/hostname
containers:
main:
image:
repository: ollama/ollama
tag: 0.9.4
pullPolicy: IfNotPresent
env:
- name: OLLAMA_KEEP_ALIVE
value: 24h
- name: OLLAMA_HOST
value: 0.0.0.0
resources:
limits:
gpu.intel.com/i915: 1
requests:
cpu: 100m
memory: 1Gi
gpu.intel.com/i915: 1
web:
type: deployment
replicas: 1
strategy: Recreate
revisionHistoryLimit: 3
containers:
main:
image:
repository: ghcr.io/open-webui/open-webui
tag: v0.6.15
pullPolicy: IfNotPresent
env:
- name: ENV
value: prod
- name: WEBUI_AUTH
value: true
- name: WEBUI_NAME
value: Ollama
- name: WEBUI_URL
value: http://ollama.alexlebens.net
- name: ENABLE_LOGIN_FORM
value: false
- name: DEFAULT_USER_ROLE
value: admin
- name: WEBUI_SECRET_KEY
valueFrom:
secretKeyRef:
name: ollama-key-secret
key: key
- name: DATABASE_URL
valueFrom:
secretKeyRef:
name: ollama-web-postgresql-17-cluster-app
key: uri
- name: OLLAMA_BASE_URL
value: http://ollama-server-1.ollama:11434
- name: ENABLE_OAUTH_SIGNUP
value: true
- name: OAUTH_USERNAME_CLAIM
value: preferred_username
- name: OAUTH_CLIENT_SECRET
valueFrom:
secretKeyRef:
name: ollama-oidc-secret
key: secret
- name: OAUTH_CLIENT_ID
valueFrom:
secretKeyRef:
name: ollama-oidc-secret
key: client
- name: OAUTH_PROVIDER_NAME
value: Authentik
- name: OPENID_PROVIDER_URL
value: https://authentik.alexlebens.net/application/o/ollama/.well-known/openid-configuration
resources:
requests:
cpu: 10m
memory: 1Gi
service:
server-1:
controller: server-1
ports:
http:
port: 11434
targetPort: 11434
protocol: HTTP
server-2:
controller: server-2
ports:
http:
port: 11434
targetPort: 11434
protocol: HTTP
server-3:
controller: server-3
ports:
http:
port: 11434
targetPort: 11434
protocol: HTTP
web:
controller: web
ports:
http:
port: 80
targetPort: 8080
protocol: HTTP
persistence:
server-1:
storageClass: ceph-block
accessMode: ReadWriteOnce
size: 40Gi
retain: true
advancedMounts:
server-1:
main:
- path: /root/.ollama
readOnly: false
server-2:
storageClass: ceph-block
accessMode: ReadWriteOnce
size: 40Gi
retain: true
advancedMounts:
server-2:
main:
- path: /root/.ollama
readOnly: false
server-3:
storageClass: ceph-block
accessMode: ReadWriteOnce
size: 40Gi
retain: true
advancedMounts:
server-3:
main:
- path: /root/.ollama
readOnly: false
web-data:
storageClass: ceph-block
accessMode: ReadWriteOnce
size: 5Gi
retain: true
advancedMounts:
web:
main:
- path: /app/backend/data
readOnly: false
postgres-17-cluster:
nameOverride: ollama-web-postgresql-17
mode: standalone
cluster:
storage:
storageClass: local-path
walStorage:
storageClass: local-path
monitoring:
enabled: true
prometheusRule:
enabled: true
recovery:
method: objectStore
objectStore:
endpointURL: https://nyc3.digitaloceanspaces.com
destinationPath: s3://postgres-backups-ce540ddf106d186bbddca68a/cl01tl/ollama/ollama-web-postgresql-17-cluster
endpointCredentials: ollama-web-postgresql-17-cluster-backup-secret
recoveryIndex: 2
backup:
enabled: true
endpointURL: https://nyc3.digitaloceanspaces.com
destinationPath: s3://postgres-backups-ce540ddf106d186bbddca68a/cl01tl/ollama/ollama-web-postgresql-17-cluster
endpointCredentials: ollama-web-postgresql-17-cluster-backup-secret
backupIndex: 2