add more servers
This commit is contained in:
@@ -1,10 +1,94 @@
|
||||
ollama:
|
||||
controllers:
|
||||
main:
|
||||
server-1:
|
||||
type: deployment
|
||||
labels:
|
||||
ollama-type: server
|
||||
replicas: 1
|
||||
strategy: Recreate
|
||||
revisionHistoryLimit: 3
|
||||
pod:
|
||||
affinity:
|
||||
podAntiAffinity:
|
||||
requiredDuringSchedulingIgnoredDuringExecution:
|
||||
- labelSelector:
|
||||
matchExpressions:
|
||||
- key: ollama-type
|
||||
operator: In
|
||||
values:
|
||||
- server
|
||||
containers:
|
||||
main:
|
||||
image:
|
||||
repository: ollama/ollama
|
||||
tag: 0.5.7
|
||||
pullPolicy: IfNotPresent
|
||||
env:
|
||||
- name: OLLAMA_KEEP_ALIVE
|
||||
value: 24h
|
||||
- name: OLLAMA_HOST
|
||||
value: 0.0.0.0
|
||||
resources:
|
||||
requests:
|
||||
cpu: 100m
|
||||
memory: 1Gi
|
||||
gpu.intel.com/i915: 1
|
||||
limits:
|
||||
cpu: 4
|
||||
gpu.intel.com/i915: 1
|
||||
server-2:
|
||||
type: deployment
|
||||
labels:
|
||||
ollama-type: server
|
||||
replicas: 1
|
||||
strategy: Recreate
|
||||
revisionHistoryLimit: 3
|
||||
pod:
|
||||
affinity:
|
||||
podAntiAffinity:
|
||||
requiredDuringSchedulingIgnoredDuringExecution:
|
||||
- labelSelector:
|
||||
matchExpressions:
|
||||
- key: ollama-type
|
||||
operator: In
|
||||
values:
|
||||
- server
|
||||
containers:
|
||||
main:
|
||||
image:
|
||||
repository: ollama/ollama
|
||||
tag: 0.5.7
|
||||
pullPolicy: IfNotPresent
|
||||
env:
|
||||
- name: OLLAMA_KEEP_ALIVE
|
||||
value: 24h
|
||||
- name: OLLAMA_HOST
|
||||
value: 0.0.0.0
|
||||
resources:
|
||||
requests:
|
||||
cpu: 100m
|
||||
memory: 1Gi
|
||||
gpu.intel.com/i915: 1
|
||||
limits:
|
||||
cpu: 4
|
||||
gpu.intel.com/i915: 1
|
||||
server-3:
|
||||
type: deployment
|
||||
labels:
|
||||
ollama-type: server
|
||||
replicas: 1
|
||||
strategy: Recreate
|
||||
revisionHistoryLimit: 3
|
||||
pod:
|
||||
affinity:
|
||||
podAntiAffinity:
|
||||
requiredDuringSchedulingIgnoredDuringExecution:
|
||||
- labelSelector:
|
||||
matchExpressions:
|
||||
- key: ollama-type
|
||||
operator: In
|
||||
values:
|
||||
- server
|
||||
containers:
|
||||
main:
|
||||
image:
|
||||
@@ -59,7 +143,7 @@ ollama:
|
||||
name: ollama-web-postgresql-17-cluster-app
|
||||
key: uri
|
||||
- name: OLLAMA_BASE_URL
|
||||
value: http://ollama-main.ollama:11434
|
||||
value: http://ollama-server-1.ollama:11434
|
||||
- name: ENABLE_OAUTH_SIGNUP
|
||||
value: true
|
||||
- name: OAUTH_USERNAME_CLAIM
|
||||
@@ -85,8 +169,22 @@ ollama:
|
||||
serviceAccount:
|
||||
create: true
|
||||
service:
|
||||
main:
|
||||
controller: main
|
||||
server-1:
|
||||
controller: server-1
|
||||
ports:
|
||||
http:
|
||||
port: 11434
|
||||
targetPort: 11434
|
||||
protocol: HTTP
|
||||
server-2:
|
||||
controller: server-2
|
||||
ports:
|
||||
http:
|
||||
port: 11434
|
||||
targetPort: 11434
|
||||
protocol: HTTP
|
||||
server-3:
|
||||
controller: server-3
|
||||
ports:
|
||||
http:
|
||||
port: 11434
|
||||
@@ -115,13 +213,33 @@ ollama:
|
||||
hosts:
|
||||
- ollama-cl01tl
|
||||
persistence:
|
||||
root:
|
||||
storageClass: ceph-block
|
||||
server-1:
|
||||
storageClass: ceph-block-delete
|
||||
accessMode: ReadWriteOnce
|
||||
size: 100Gi
|
||||
size: 40Gi
|
||||
retain: true
|
||||
advancedMounts:
|
||||
main:
|
||||
server-1:
|
||||
main:
|
||||
- path: /root/.ollama
|
||||
readOnly: false
|
||||
server-2:
|
||||
storageClass: ceph-block-delete
|
||||
accessMode: ReadWriteOnce
|
||||
size: 40Gi
|
||||
retain: true
|
||||
advancedMounts:
|
||||
server-2:
|
||||
main:
|
||||
- path: /root/.ollama
|
||||
readOnly: false
|
||||
server-3:
|
||||
storageClass: ceph-block-delete
|
||||
accessMode: ReadWriteOnce
|
||||
size: 40Gi
|
||||
retain: true
|
||||
advancedMounts:
|
||||
server-3:
|
||||
main:
|
||||
- path: /root/.ollama
|
||||
readOnly: false
|
||||
|
Reference in New Issue
Block a user