add more servers
This commit is contained in:
@@ -1,10 +1,94 @@
|
|||||||
ollama:
|
ollama:
|
||||||
controllers:
|
controllers:
|
||||||
main:
|
server-1:
|
||||||
type: deployment
|
type: deployment
|
||||||
|
labels:
|
||||||
|
ollama-type: server
|
||||||
replicas: 1
|
replicas: 1
|
||||||
strategy: Recreate
|
strategy: Recreate
|
||||||
revisionHistoryLimit: 3
|
revisionHistoryLimit: 3
|
||||||
|
pod:
|
||||||
|
affinity:
|
||||||
|
podAntiAffinity:
|
||||||
|
requiredDuringSchedulingIgnoredDuringExecution:
|
||||||
|
- labelSelector:
|
||||||
|
matchExpressions:
|
||||||
|
- key: ollama-type
|
||||||
|
operator: In
|
||||||
|
values:
|
||||||
|
- server
|
||||||
|
containers:
|
||||||
|
main:
|
||||||
|
image:
|
||||||
|
repository: ollama/ollama
|
||||||
|
tag: 0.5.7
|
||||||
|
pullPolicy: IfNotPresent
|
||||||
|
env:
|
||||||
|
- name: OLLAMA_KEEP_ALIVE
|
||||||
|
value: 24h
|
||||||
|
- name: OLLAMA_HOST
|
||||||
|
value: 0.0.0.0
|
||||||
|
resources:
|
||||||
|
requests:
|
||||||
|
cpu: 100m
|
||||||
|
memory: 1Gi
|
||||||
|
gpu.intel.com/i915: 1
|
||||||
|
limits:
|
||||||
|
cpu: 4
|
||||||
|
gpu.intel.com/i915: 1
|
||||||
|
server-2:
|
||||||
|
type: deployment
|
||||||
|
labels:
|
||||||
|
ollama-type: server
|
||||||
|
replicas: 1
|
||||||
|
strategy: Recreate
|
||||||
|
revisionHistoryLimit: 3
|
||||||
|
pod:
|
||||||
|
affinity:
|
||||||
|
podAntiAffinity:
|
||||||
|
requiredDuringSchedulingIgnoredDuringExecution:
|
||||||
|
- labelSelector:
|
||||||
|
matchExpressions:
|
||||||
|
- key: ollama-type
|
||||||
|
operator: In
|
||||||
|
values:
|
||||||
|
- server
|
||||||
|
containers:
|
||||||
|
main:
|
||||||
|
image:
|
||||||
|
repository: ollama/ollama
|
||||||
|
tag: 0.5.7
|
||||||
|
pullPolicy: IfNotPresent
|
||||||
|
env:
|
||||||
|
- name: OLLAMA_KEEP_ALIVE
|
||||||
|
value: 24h
|
||||||
|
- name: OLLAMA_HOST
|
||||||
|
value: 0.0.0.0
|
||||||
|
resources:
|
||||||
|
requests:
|
||||||
|
cpu: 100m
|
||||||
|
memory: 1Gi
|
||||||
|
gpu.intel.com/i915: 1
|
||||||
|
limits:
|
||||||
|
cpu: 4
|
||||||
|
gpu.intel.com/i915: 1
|
||||||
|
server-3:
|
||||||
|
type: deployment
|
||||||
|
labels:
|
||||||
|
ollama-type: server
|
||||||
|
replicas: 1
|
||||||
|
strategy: Recreate
|
||||||
|
revisionHistoryLimit: 3
|
||||||
|
pod:
|
||||||
|
affinity:
|
||||||
|
podAntiAffinity:
|
||||||
|
requiredDuringSchedulingIgnoredDuringExecution:
|
||||||
|
- labelSelector:
|
||||||
|
matchExpressions:
|
||||||
|
- key: ollama-type
|
||||||
|
operator: In
|
||||||
|
values:
|
||||||
|
- server
|
||||||
containers:
|
containers:
|
||||||
main:
|
main:
|
||||||
image:
|
image:
|
||||||
@@ -59,7 +143,7 @@ ollama:
|
|||||||
name: ollama-web-postgresql-17-cluster-app
|
name: ollama-web-postgresql-17-cluster-app
|
||||||
key: uri
|
key: uri
|
||||||
- name: OLLAMA_BASE_URL
|
- name: OLLAMA_BASE_URL
|
||||||
value: http://ollama-main.ollama:11434
|
value: http://ollama-server-1.ollama:11434
|
||||||
- name: ENABLE_OAUTH_SIGNUP
|
- name: ENABLE_OAUTH_SIGNUP
|
||||||
value: true
|
value: true
|
||||||
- name: OAUTH_USERNAME_CLAIM
|
- name: OAUTH_USERNAME_CLAIM
|
||||||
@@ -85,8 +169,22 @@ ollama:
|
|||||||
serviceAccount:
|
serviceAccount:
|
||||||
create: true
|
create: true
|
||||||
service:
|
service:
|
||||||
main:
|
server-1:
|
||||||
controller: main
|
controller: server-1
|
||||||
|
ports:
|
||||||
|
http:
|
||||||
|
port: 11434
|
||||||
|
targetPort: 11434
|
||||||
|
protocol: HTTP
|
||||||
|
server-2:
|
||||||
|
controller: server-2
|
||||||
|
ports:
|
||||||
|
http:
|
||||||
|
port: 11434
|
||||||
|
targetPort: 11434
|
||||||
|
protocol: HTTP
|
||||||
|
server-3:
|
||||||
|
controller: server-3
|
||||||
ports:
|
ports:
|
||||||
http:
|
http:
|
||||||
port: 11434
|
port: 11434
|
||||||
@@ -115,13 +213,33 @@ ollama:
|
|||||||
hosts:
|
hosts:
|
||||||
- ollama-cl01tl
|
- ollama-cl01tl
|
||||||
persistence:
|
persistence:
|
||||||
root:
|
server-1:
|
||||||
storageClass: ceph-block
|
storageClass: ceph-block-delete
|
||||||
accessMode: ReadWriteOnce
|
accessMode: ReadWriteOnce
|
||||||
size: 100Gi
|
size: 40Gi
|
||||||
retain: true
|
retain: true
|
||||||
advancedMounts:
|
advancedMounts:
|
||||||
main:
|
server-1:
|
||||||
|
main:
|
||||||
|
- path: /root/.ollama
|
||||||
|
readOnly: false
|
||||||
|
server-2:
|
||||||
|
storageClass: ceph-block-delete
|
||||||
|
accessMode: ReadWriteOnce
|
||||||
|
size: 40Gi
|
||||||
|
retain: true
|
||||||
|
advancedMounts:
|
||||||
|
server-2:
|
||||||
|
main:
|
||||||
|
- path: /root/.ollama
|
||||||
|
readOnly: false
|
||||||
|
server-3:
|
||||||
|
storageClass: ceph-block-delete
|
||||||
|
accessMode: ReadWriteOnce
|
||||||
|
size: 40Gi
|
||||||
|
retain: true
|
||||||
|
advancedMounts:
|
||||||
|
server-3:
|
||||||
main:
|
main:
|
||||||
- path: /root/.ollama
|
- path: /root/.ollama
|
||||||
readOnly: false
|
readOnly: false
|
||||||
|
Reference in New Issue
Block a user