diff --git a/clusters/cl01tl/manifests/immich/-.yaml b/clusters/cl01tl/manifests/immich/-.yaml deleted file mode 100644 index 8b1378917..000000000 --- a/clusters/cl01tl/manifests/immich/-.yaml +++ /dev/null @@ -1 +0,0 @@ - diff --git a/clusters/cl01tl/manifests/immich/Cluster-immich-postgresql-18-cluster.yaml b/clusters/cl01tl/manifests/immich/Cluster-immich-postgresql-18-cluster.yaml new file mode 100644 index 000000000..cfeec6e35 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Cluster-immich-postgresql-18-cluster.yaml @@ -0,0 +1,68 @@ +apiVersion: postgresql.cnpg.io/v1 +kind: Cluster +metadata: + name: immich-postgresql-18-cluster + namespace: immich + labels: + app.kubernetes.io/name: immich-postgresql-18-cluster + helm.sh/chart: postgres-18-cluster-7.12.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "7.12.1" + app.kubernetes.io/managed-by: Helm +spec: + instances: 3 + imageName: "ghcr.io/tensorchord/cloudnative-vectorchord:18.0-0.5.3" + imagePullPolicy: IfNotPresent + postgresUID: 26 + postgresGID: 26 + storage: + size: 10Gi + storageClass: local-path + walStorage: + size: 2Gi + storageClass: local-path + resources: + limits: + hugepages-2Mi: 256Mi + requests: + cpu: 20m + memory: 80Mi + affinity: + enablePodAntiAffinity: true + topologyKey: kubernetes.io/hostname + primaryUpdateMethod: switchover + primaryUpdateStrategy: unsupervised + logLevel: info + enableSuperuserAccess: false + enablePDB: true + postgresql: + shared_preload_libraries: + - vchord.so + parameters: + hot_standby_feedback: "on" + max_slot_wal_keep_size: 2000MB + shared_buffers: 256MB + monitoring: + enablePodMonitor: true + disableDefaultQueries: false + plugins: + - name: barman-cloud.cloudnative-pg.io + enabled: true + isWALArchiver: true + parameters: + barmanObjectName: "immich-postgresql-18-backup-garage-local" + serverName: "immich-postgresql-18-backup-1" + bootstrap: + recovery: + database: app + source: 
immich-postgresql-18-backup-1 + externalClusters: + - name: immich-postgresql-18-backup-1 + plugin: + name: barman-cloud.cloudnative-pg.io + enabled: true + isWALArchiver: false + parameters: + barmanObjectName: "immich-postgresql-18-recovery" + serverName: immich-postgresql-18-backup-1 diff --git a/clusters/cl01tl/manifests/immich/ConfigMap-immich-valkey-init-scripts.yaml b/clusters/cl01tl/manifests/immich/ConfigMap-immich-valkey-init-scripts.yaml new file mode 100644 index 000000000..6eff7c092 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ConfigMap-immich-valkey-init-scripts.yaml @@ -0,0 +1,87 @@ +apiVersion: v1 +kind: ConfigMap +metadata: + name: immich-valkey-init-scripts + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm +data: + init.sh: |- + #!/bin/sh + set -eu + + # Default config paths + VALKEY_CONFIG=${VALKEY_CONFIG_PATH:-/data/conf/valkey.conf} + + LOGFILE="/data/init.log" + DATA_DIR="/data/conf" + + # Logging function (outputs to stderr and file) + log() { + echo "$(date) $1" | tee -a "$LOGFILE" >&2 + } + + # Clean old log if requested + if [ "${KEEP_OLD_LOGS:-false}" != "true" ]; then + rm -f "$LOGFILE" + fi + + if [ -f "$LOGFILE" ]; then + log "Detected restart of this instance ($HOSTNAME)" + fi + + log "Creating configuration in $DATA_DIR..." 
+ mkdir -p "$DATA_DIR" + rm -f "$VALKEY_CONFIG" + + + # Base valkey.conf + log "Generating base valkey.conf" + { + echo "port 6379" + echo "protected-mode no" + echo "bind * -::*" + echo "dir /data" + } >>"$VALKEY_CONFIG" + # Replica mode configuration + log "Configuring replication mode" + + # Use POD_INDEX from Kubernetes metadata + POD_INDEX=${POD_INDEX:-0} + IS_MASTER=false + + # Check if this is pod-0 (master) + if [ "$POD_INDEX" = "0" ]; then + IS_MASTER=true + log "This pod (index $POD_INDEX) is configured as MASTER" + else + log "This pod (index $POD_INDEX) is configured as REPLICA" + fi + + # Configure replica settings + if [ "$IS_MASTER" = "false" ]; then + MASTER_HOST="immich-valkey-0.immich-valkey-headless.immich.svc.cluster.local" + MASTER_PORT="6379" + + log "Configuring replica to follow master at $MASTER_HOST:$MASTER_PORT" + + { + echo "" + echo "# Replica Configuration" + echo "replicaof $MASTER_HOST $MASTER_PORT" + echo "replica-announce-ip immich-valkey-$POD_INDEX.immich-valkey-headless.immich.svc.cluster.local" + } >>"$VALKEY_CONFIG" + fi + + # Append extra configs if present + if [ -f /usr/local/etc/valkey/valkey.conf ]; then + log "Appending /usr/local/etc/valkey/valkey.conf" + cat /usr/local/etc/valkey/valkey.conf >>"$VALKEY_CONFIG" + fi + if [ -d /extravalkeyconfigs ]; then + log "Appending files in /extravalkeyconfigs/" + cat /extravalkeyconfigs/* >>"$VALKEY_CONFIG" + fi diff --git a/clusters/cl01tl/manifests/immich/Deployment-immich.yaml b/clusters/cl01tl/manifests/immich/Deployment-immich.yaml new file mode 100644 index 000000000..545ba0eea --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Deployment-immich.yaml @@ -0,0 +1,125 @@ +apiVersion: apps/v1 +kind: Deployment +metadata: + name: immich + labels: + app.kubernetes.io/controller: main + app.kubernetes.io/instance: immich + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich + helm.sh/chart: immich-4.6.2 + namespace: immich +spec: + revisionHistoryLimit: 3 + 
replicas: 1 + strategy: + type: Recreate + selector: + matchLabels: + app.kubernetes.io/controller: main + app.kubernetes.io/name: immich + app.kubernetes.io/instance: immich + template: + metadata: + annotations: + checksum/secrets: 46a3f57ca394cccffc419e0c17f5d5f366374b0651c02c507636c53c0b5f33e6 + labels: + app.kubernetes.io/controller: main + app.kubernetes.io/instance: immich + app.kubernetes.io/name: immich + spec: + enableServiceLinks: false + serviceAccountName: immich + automountServiceAccountToken: true + hostIPC: false + hostNetwork: false + hostPID: false + dnsPolicy: ClusterFirst + containers: + - env: + - name: TZ + value: America/Chicago + - name: IMMICH_TELEMETRY_INCLUDE + value: all + - name: IMMICH_CONFIG_FILE + value: /config/immich.json + - name: REDIS_HOSTNAME + value: immich-valkey + - name: DB_VECTOR_EXTENSION + value: vectorchord + - name: DB_HOSTNAME + valueFrom: + secretKeyRef: + key: host + name: immich-postgresql-18-cluster-app + - name: DB_DATABASE_NAME + valueFrom: + secretKeyRef: + key: dbname + name: immich-postgresql-18-cluster-app + - name: DB_PORT + valueFrom: + secretKeyRef: + key: port + name: immich-postgresql-18-cluster-app + - name: DB_USERNAME + valueFrom: + secretKeyRef: + key: user + name: immich-postgresql-18-cluster-app + - name: DB_PASSWORD + valueFrom: + secretKeyRef: + key: password + name: immich-postgresql-18-cluster-app + image: ghcr.io/immich-app/immich-server:v2.7.5@sha256:c15bff75068effb03f4355997d03dc7e0fc58720c2b54ad6f7f10d1bc57efaa5 + livenessProbe: + failureThreshold: 3 + httpGet: + path: /api/server/ping + port: 2283 + initialDelaySeconds: 0 + periodSeconds: 10 + timeoutSeconds: 1 + name: main + readinessProbe: + failureThreshold: 3 + httpGet: + path: /api/server/ping + port: 2283 + initialDelaySeconds: 0 + periodSeconds: 10 + timeoutSeconds: 1 + resources: + limits: + gpu.intel.com/i915: 1 + requests: + cpu: 10m + gpu.intel.com/i915: 1 + memory: 500Mi + startupProbe: + failureThreshold: 30 + httpGet: + 
path: /api/server/ping + port: 2283 + initialDelaySeconds: 0 + periodSeconds: 10 + timeoutSeconds: 1 + volumeMounts: + - mountPath: /config/immich.json + mountPropagation: None + name: config + readOnly: true + subPath: immich.json + - mountPath: /usr/src/app/upload + name: data + volumes: + - csi: + driver: secrets-store.csi.k8s.io + readOnly: true + volumeAttributes: + secretProviderClass: immich-config + name: config + - name: data + persistentVolumeClaim: + claimName: immich diff --git a/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-external.yaml b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-external.yaml new file mode 100644 index 000000000..f0fd469dc --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-external.yaml @@ -0,0 +1,47 @@ +apiVersion: external-secrets.io/v1 +kind: ExternalSecret +metadata: + name: immich-backup-secret-external + namespace: immich + labels: + helm.sh/chart: volsync-target-data-1.1.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "1.1.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-backup-secret-external +spec: + secretStoreRef: + kind: ClusterSecretStore + name: openbao + target: + template: + mergePolicy: Merge + engineVersion: v2 + data: + RESTIC_REPOSITORY: "s3:{{ .ENDPOINT }}/{{ .BUCKET }}/cl01tl/immich/immich" + data: + - secretKey: ENDPOINT + remoteRef: + key: /digital-ocean/config + property: ENDPOINT + - secretKey: BUCKET + remoteRef: + key: /digital-ocean/home-infra/volsync-backups + property: BUCKET + - secretKey: RESTIC_PASSWORD + remoteRef: + key: /digital-ocean/home-infra/volsync-backups + property: RESTIC_PASSWORD + - secretKey: AWS_DEFAULT_REGION + remoteRef: + key: /digital-ocean/home-infra/volsync-backups + property: AWS_REGION + - secretKey: AWS_ACCESS_KEY_ID + remoteRef: + key: /digital-ocean/home-infra/volsync-backups + property: AWS_ACCESS_KEY_ID + - 
secretKey: AWS_SECRET_ACCESS_KEY + remoteRef: + key: /digital-ocean/home-infra/volsync-backups + property: AWS_SECRET_ACCESS_KEY diff --git a/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-local.yaml b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-local.yaml new file mode 100644 index 000000000..0ee9fe200 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-local.yaml @@ -0,0 +1,47 @@ +apiVersion: external-secrets.io/v1 +kind: ExternalSecret +metadata: + name: immich-backup-secret-local + namespace: immich + labels: + helm.sh/chart: volsync-target-data-1.1.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "1.1.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-backup-secret-local +spec: + secretStoreRef: + kind: ClusterSecretStore + name: openbao + target: + template: + mergePolicy: Merge + engineVersion: v2 + data: + RESTIC_REPOSITORY: "s3:{{ .ENDPOINT }}/{{ .BUCKET }}/cl01tl/immich/immich" + data: + - secretKey: ENDPOINT + remoteRef: + key: /garage/config + property: ENDPOINT_LOCAL + - secretKey: BUCKET + remoteRef: + key: /garage/home-infra/volsync-backups + property: BUCKET + - secretKey: RESTIC_PASSWORD + remoteRef: + key: /garage/home-infra/volsync-backups + property: RESTIC_PASSWORD_LOCAL + - secretKey: AWS_DEFAULT_REGION + remoteRef: + key: /garage/home-infra/volsync-backups + property: ACCESS_REGION + - secretKey: AWS_ACCESS_KEY_ID + remoteRef: + key: /garage/home-infra/volsync-backups + property: ACCESS_KEY_ID + - secretKey: AWS_SECRET_ACCESS_KEY + remoteRef: + key: /garage/home-infra/volsync-backups + property: ACCESS_SECRET_KEY diff --git a/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-remote.yaml b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-remote.yaml new file mode 100644 index 000000000..6c944429c --- /dev/null +++ 
b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-backup-secret-remote.yaml @@ -0,0 +1,47 @@ +apiVersion: external-secrets.io/v1 +kind: ExternalSecret +metadata: + name: immich-backup-secret-remote + namespace: immich + labels: + helm.sh/chart: volsync-target-data-1.1.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "1.1.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-backup-secret-remote +spec: + secretStoreRef: + kind: ClusterSecretStore + name: openbao + target: + template: + mergePolicy: Merge + engineVersion: v2 + data: + RESTIC_REPOSITORY: "s3:{{ .ENDPOINT }}/{{ .BUCKET }}/cl01tl/immich/immich" + data: + - secretKey: ENDPOINT + remoteRef: + key: /garage/config + property: ENDPOINT_REMOTE + - secretKey: BUCKET + remoteRef: + key: /garage/home-infra/volsync-backups + property: BUCKET + - secretKey: RESTIC_PASSWORD + remoteRef: + key: /garage/home-infra/volsync-backups + property: RESTIC_PASSWORD_REMOTE + - secretKey: AWS_DEFAULT_REGION + remoteRef: + key: /garage/home-infra/volsync-backups + property: ACCESS_REGION + - secretKey: AWS_ACCESS_KEY_ID + remoteRef: + key: /garage/home-infra/volsync-backups + property: ACCESS_KEY_ID + - secretKey: AWS_SECRET_ACCESS_KEY + remoteRef: + key: /garage/home-infra/volsync-backups + property: ACCESS_SECRET_KEY diff --git a/clusters/cl01tl/manifests/immich/ExternalSecret-immich-postgresql-18-backup-garage-local-secret.yaml b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-postgresql-18-backup-garage-local-secret.yaml new file mode 100644 index 000000000..872987bdb --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-postgresql-18-backup-garage-local-secret.yaml @@ -0,0 +1,29 @@ +apiVersion: external-secrets.io/v1 +kind: ExternalSecret +metadata: + name: immich-postgresql-18-backup-garage-local-secret + namespace: immich + labels: + app.kubernetes.io/name: immich-postgresql-18-backup-garage-local-secret + 
helm.sh/chart: postgres-18-cluster-7.12.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "7.12.1" + app.kubernetes.io/managed-by: Helm +spec: + secretStoreRef: + kind: ClusterSecretStore + name: openbao + data: + - secretKey: ACCESS_REGION + remoteRef: + key: /garage/home-infra/postgres-backups + property: ACCESS_REGION + - secretKey: ACCESS_KEY_ID + remoteRef: + key: /garage/home-infra/postgres-backups + property: ACCESS_KEY_ID + - secretKey: ACCESS_SECRET_KEY + remoteRef: + key: /garage/home-infra/postgres-backups + property: ACCESS_SECRET_KEY diff --git a/clusters/cl01tl/manifests/immich/ExternalSecret-immich-postgresql-18-recovery-secret.yaml b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-postgresql-18-recovery-secret.yaml new file mode 100644 index 000000000..4032effcb --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ExternalSecret-immich-postgresql-18-recovery-secret.yaml @@ -0,0 +1,29 @@ +apiVersion: external-secrets.io/v1 +kind: ExternalSecret +metadata: + name: immich-postgresql-18-recovery-secret + namespace: immich + labels: + helm.sh/chart: postgres-18-cluster-7.12.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "7.12.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-postgresql-18-recovery-secret +spec: + secretStoreRef: + kind: ClusterSecretStore + name: openbao + data: + - secretKey: ACCESS_REGION + remoteRef: + key: /garage/home-infra/postgres-backups + property: ACCESS_REGION + - secretKey: ACCESS_KEY_ID + remoteRef: + key: /garage/home-infra/postgres-backups + property: ACCESS_KEY_ID + - secretKey: ACCESS_SECRET_KEY + remoteRef: + key: /garage/home-infra/postgres-backups + property: ACCESS_SECRET_KEY diff --git a/clusters/cl01tl/manifests/immich/HTTPRoute-immich.yaml b/clusters/cl01tl/manifests/immich/HTTPRoute-immich.yaml new file mode 100644 index 000000000..b8475cbe9 --- /dev/null +++ 
b/clusters/cl01tl/manifests/immich/HTTPRoute-immich.yaml @@ -0,0 +1,30 @@ +apiVersion: gateway.networking.k8s.io/v1 +kind: HTTPRoute +metadata: + name: immich + labels: + app.kubernetes.io/instance: immich + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich + helm.sh/chart: immich-4.6.2 + namespace: immich +spec: + parentRefs: + - group: gateway.networking.k8s.io + kind: Gateway + name: traefik-gateway + namespace: traefik + hostnames: + - "immich.alexlebens.net" + rules: + - backendRefs: + - group: "" + kind: Service + name: immich + namespace: immich + port: 2283 + weight: 1 + matches: + - path: + type: PathPrefix + value: / diff --git a/clusters/cl01tl/manifests/immich/ObjectStore-immich-postgresql-18-backup-garage-local.yaml b/clusters/cl01tl/manifests/immich/ObjectStore-immich-postgresql-18-backup-garage-local.yaml new file mode 100644 index 000000000..2a0852f0c --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ObjectStore-immich-postgresql-18-backup-garage-local.yaml @@ -0,0 +1,33 @@ +apiVersion: barmancloud.cnpg.io/v1 +kind: ObjectStore +metadata: + name: immich-postgresql-18-backup-garage-local + namespace: immich + labels: + app.kubernetes.io/name: immich-postgresql-18-backup-garage-local + helm.sh/chart: postgres-18-cluster-7.12.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "7.12.1" + app.kubernetes.io/managed-by: Helm +spec: + retentionPolicy: 7d + instanceSidecarConfiguration: + env: + - name: AWS_REQUEST_CHECKSUM_CALCULATION + value: when_required + - name: AWS_RESPONSE_CHECKSUM_VALIDATION + value: when_required + configuration: + destinationPath: s3://postgres-backups/cl01tl/immich/immich-postgresql-18-cluster + endpointURL: http://garage-main.garage:3900 + s3Credentials: + accessKeyId: + name: immich-postgresql-18-backup-garage-local-secret + key: ACCESS_KEY_ID + secretAccessKey: + name: immich-postgresql-18-backup-garage-local-secret + key: ACCESS_SECRET_KEY + region: + 
name: immich-postgresql-18-backup-garage-local-secret + key: ACCESS_REGION diff --git a/clusters/cl01tl/manifests/immich/ObjectStore-immich-postgresql-18-recovery.yaml b/clusters/cl01tl/manifests/immich/ObjectStore-immich-postgresql-18-recovery.yaml new file mode 100644 index 000000000..2c0f41c0e --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ObjectStore-immich-postgresql-18-recovery.yaml @@ -0,0 +1,32 @@ +apiVersion: barmancloud.cnpg.io/v1 +kind: ObjectStore +metadata: + name: "immich-postgresql-18-recovery" + namespace: immich + labels: + helm.sh/chart: postgres-18-cluster-7.12.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "7.12.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: "immich-postgresql-18-recovery" +spec: + configuration: + destinationPath: s3://postgres-backups/cl01tl/immich/immich-postgresql-18-cluster + endpointURL: http://garage-main.garage:3900 + wal: + compression: snappy + maxParallel: 1 + data: + compression: snappy + jobs: 1 + s3Credentials: + accessKeyId: + name: immich-postgresql-18-recovery-secret + key: ACCESS_KEY_ID + secretAccessKey: + name: immich-postgresql-18-recovery-secret + key: ACCESS_SECRET_KEY + region: + name: immich-postgresql-18-recovery-secret + key: ACCESS_REGION diff --git a/clusters/cl01tl/manifests/immich/PersistentVolumeClaim-immich.yaml b/clusters/cl01tl/manifests/immich/PersistentVolumeClaim-immich.yaml new file mode 100644 index 000000000..0ad202dd2 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/PersistentVolumeClaim-immich.yaml @@ -0,0 +1,19 @@ +kind: PersistentVolumeClaim +apiVersion: v1 +metadata: + name: immich + labels: + app.kubernetes.io/instance: immich + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich + helm.sh/chart: immich-4.6.2 + annotations: + helm.sh/resource-policy: keep + namespace: immich +spec: + accessModes: + - "ReadWriteOnce" + resources: + requests: + storage: "50Gi" + storageClassName: 
"ceph-block" diff --git a/clusters/cl01tl/manifests/immich/PodMonitor-immich-valkey.yaml b/clusters/cl01tl/manifests/immich/PodMonitor-immich-valkey.yaml new file mode 100644 index 000000000..de18b8537 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/PodMonitor-immich-valkey.yaml @@ -0,0 +1,23 @@ +apiVersion: monitoring.coreos.com/v1 +kind: PodMonitor +metadata: + name: immich-valkey + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/part-of: valkey + app.kubernetes.io/component: podmonitor +spec: + podMetricsEndpoints: + - port: metrics + interval: 30s + namespaceSelector: + matchNames: + - immich + selector: + matchLabels: + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich diff --git a/clusters/cl01tl/manifests/immich/PrometheusRule-immich-backup-source-local.yaml b/clusters/cl01tl/manifests/immich/PrometheusRule-immich-backup-source-local.yaml new file mode 100644 index 000000000..a476eddd7 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/PrometheusRule-immich-backup-source-local.yaml @@ -0,0 +1,30 @@ +apiVersion: monitoring.coreos.com/v1 +kind: PrometheusRule +metadata: + name: immich-backup-source-local + namespace: immich + labels: + helm.sh/chart: volsync-target-data-1.1.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "1.1.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-backup-source-local +spec: + groups: + - name: volsync.alerts + rules: + - alert: VolSyncBackupPodFailed + expr: | + (kube_pod_container_status_last_terminated_exitcode > 0) + * on(pod, namespace) group_left(owner_name) + kube_pod_owner{owner_kind="Job", owner_name=~"volsync-.*"} + for: 1m + labels: + severity: critical + annotations: + summary: "VolSync Backup Pod failed in {{ $labels.namespace }}" + description: | + A pod for the 
VolSync backup of PVC 'immich' failed with exit code {{ $value }}. + Job: {{ $labels.owner_name }} + Namespace: {{ $labels.namespace }} diff --git a/clusters/cl01tl/manifests/immich/PrometheusRule-immich-postgresql-18-alert-rules.yaml b/clusters/cl01tl/manifests/immich/PrometheusRule-immich-postgresql-18-alert-rules.yaml new file mode 100644 index 000000000..6d5b90393 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/PrometheusRule-immich-postgresql-18-alert-rules.yaml @@ -0,0 +1,270 @@ +apiVersion: monitoring.coreos.com/v1 +kind: PrometheusRule +metadata: + name: immich-postgresql-18-alert-rules + namespace: immich + labels: + app.kubernetes.io/name: immich-postgresql-18-alert-rules + helm.sh/chart: postgres-18-cluster-7.12.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "7.12.1" + app.kubernetes.io/managed-by: Helm +spec: + groups: + - name: cloudnative-pg/immich-postgresql-18 + rules: + - alert: CNPGClusterBackendsWaitingWarning + annotations: + summary: CNPG Cluster a backend is waiting for longer than 5 minutes. + description: |- + Pod {{ $labels.pod }} + has been waiting for longer than 5 minutes + expr: | + cnpg_backends_waiting_total{namespace="immich"} > 300 + for: 1m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterDatabaseDeadlockConflictsWarning + annotations: + summary: CNPG Cluster has over 10 deadlock conflicts. + description: |- + There are over 10 deadlock conflicts in + {{ $labels.pod }} + expr: | + cnpg_pg_stat_database_deadlocks{namespace="immich"} > 10 + for: 1m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterHACritical + annotations: + summary: CNPG Cluster has no standby replicas! + description: |- + CloudNativePG Cluster "{{ $labels.job }}" has no ready standby replicas. 
Your cluster is at a severe + risk of data loss and downtime if the primary instance fails. + + The primary instance is still online and able to serve queries, although connections to the `-ro` endpoint + will fail. The `-r` endpoint is operating at reduced capacity and all traffic is being served by the main. + + This can happen during a normal fail-over or automated minor version upgrades in a cluster with 2 or less + instances. The replaced instance may need some time to catch-up with the cluster primary instance. + + This alarm will always trigger if your cluster is configured to run with only 1 instance. In this + case you may want to silence it. + runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterHACritical.md + expr: | + max by (job) (cnpg_pg_replication_streaming_replicas{namespace="immich"} - cnpg_pg_replication_is_wal_receiver_up{namespace="immich"}) < 1 + for: 5m + labels: + severity: critical + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterHAWarning + annotations: + summary: CNPG Cluster less than 2 standby replicas. + description: |- + CloudNativePG Cluster "{{ $labels.job }}" has only {{ $value }} standby replicas, putting + your cluster at risk if another instance fails. The cluster is still able to operate normally, although + the `-ro` and `-r` endpoints operate at reduced capacity. + + This can happen during a normal fail-over or automated minor version upgrades. The replaced instance may + need some time to catch-up with the cluster primary instance. + + This alarm will be constantly triggered if your cluster is configured to run with less than 3 instances. + In this case you may want to silence it. 
+ runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterHAWarning.md + expr: | + max by (job) (cnpg_pg_replication_streaming_replicas{namespace="immich"} - cnpg_pg_replication_is_wal_receiver_up{namespace="immich"}) < 2 + for: 5m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterHighConnectionsCritical + annotations: + summary: CNPG Instance maximum number of connections critical! + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" instance {{ $labels.pod }} is using {{ $value }}% of + the maximum number of connections. + runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterHighConnectionsCritical.md + expr: | + sum by (pod) (cnpg_backends_total{namespace="immich", pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"}) / max by (pod) (cnpg_pg_settings_setting{name="max_connections", namespace="immich", pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"}) * 100 > 95 + for: 5m + labels: + severity: critical + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterHighConnectionsWarning + annotations: + summary: CNPG Instance is approaching the maximum number of connections. + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" instance {{ $labels.pod }} is using {{ $value }}% of + the maximum number of connections. 
+ runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterHighConnectionsWarning.md + expr: | + sum by (pod) (cnpg_backends_total{namespace="immich", pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"}) / max by (pod) (cnpg_pg_settings_setting{name="max_connections", namespace="immich", pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"}) * 100 > 80 + for: 5m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterHighReplicationLag + annotations: + summary: CNPG Cluster high replication lag + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" is experiencing a high replication lag of + {{ $value }}ms. + + High replication lag indicates network issues, busy instances, slow queries or suboptimal configuration. + runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterHighReplicationLag.md + expr: | + max(cnpg_pg_replication_lag{namespace="immich",pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"}) * 1000 > 1000 + for: 5m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterInstancesOnSameNode + annotations: + summary: CNPG Cluster instances are located on the same node. + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" has {{ $value }} + instances on the same node {{ $labels.node }}. + + A failure or scheduled downtime of a single node will lead to a potential service disruption and/or data loss. 
+ runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterInstancesOnSameNode.md + expr: | + count by (node) (kube_pod_info{namespace="immich", pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"}) > 1 + for: 5m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterLongRunningTransactionWarning + annotations: + summary: CNPG Cluster query is taking longer than 5 minutes. + description: |- + CloudNativePG Cluster Pod {{ $labels.pod }} + is taking more than 5 minutes (300 seconds) for a query. + expr: |- + cnpg_backends_max_tx_duration_seconds{namespace="immich"} > 300 + for: 1m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterLowDiskSpaceCritical + annotations: + summary: CNPG Instance is running out of disk space! + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" is running extremely low on disk space. Check attached PVCs! 
+ runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterLowDiskSpaceCritical.md + expr: | + max(max by(persistentvolumeclaim) (1 - kubelet_volume_stats_available_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"} / kubelet_volume_stats_capacity_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"})) > 0.9 OR + max(max by(persistentvolumeclaim) (1 - kubelet_volume_stats_available_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-wal"} / kubelet_volume_stats_capacity_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-wal"})) > 0.9 OR + max(sum by (namespace,persistentvolumeclaim) (kubelet_volume_stats_used_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-tbs.*"}) + / + sum by (namespace,persistentvolumeclaim) (kubelet_volume_stats_capacity_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-tbs.*"}) + * + on(namespace, persistentvolumeclaim) group_left(volume) + kube_pod_spec_volumes_persistentvolumeclaims_info{pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"} + ) > 0.9 + for: 5m + labels: + severity: critical + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterLowDiskSpaceWarning + annotations: + summary: CNPG Instance is running out of disk space. + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" is running low on disk space. Check attached PVCs. 
+ runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterLowDiskSpaceWarning.md + expr: | + max(max by(persistentvolumeclaim) (1 - kubelet_volume_stats_available_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"} / kubelet_volume_stats_capacity_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"})) > 0.7 OR + max(max by(persistentvolumeclaim) (1 - kubelet_volume_stats_available_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-wal"} / kubelet_volume_stats_capacity_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-wal"})) > 0.7 OR + max(sum by (namespace,persistentvolumeclaim) (kubelet_volume_stats_used_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-tbs.*"}) + / + sum by (namespace,persistentvolumeclaim) (kubelet_volume_stats_capacity_bytes{namespace="immich", persistentvolumeclaim=~"immich-postgresql-18-cluster-([1-9][0-9]*)-tbs.*"}) + * + on(namespace, persistentvolumeclaim) group_left(volume) + kube_pod_spec_volumes_persistentvolumeclaims_info{pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"} + ) > 0.7 + for: 5m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterOffline + annotations: + summary: CNPG Cluster has no running instances! + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" has no ready instances. + + Having an offline cluster means your applications will not be able to access the database, leading to + potential service disruption and/or data loss. 
+ runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterOffline.md + expr: | + (count(cnpg_collector_up{namespace="immich",pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"}) OR on() vector(0)) == 0 + for: 5m + labels: + severity: critical + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterPGDatabaseXidAgeWarning + annotations: + summary: CNPG Cluster has a number of transactions from the frozen XID to the current one. + description: |- + Over 300,000,000 transactions from frozen xid + on pod {{ $labels.pod }} + expr: | + cnpg_pg_database_xid_age{namespace="immich"} > 300000000 + for: 1m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterPGReplicationWarning + annotations: + summary: CNPG Cluster standby is lagging behind the primary. + description: |- + Standby is lagging behind by over 300 seconds (5 minutes) + expr: | + cnpg_pg_replication_lag{namespace="immich"} > 300 + for: 1m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterReplicaFailingReplicationWarning + annotations: + summary: CNPG Cluster has a replica is failing to replicate. + description: |- + Replica {{ $labels.pod }} + is failing to replicate + expr: | + cnpg_pg_replication_in_recovery{namespace="immich"} > cnpg_pg_replication_is_wal_receiver_up{namespace="immich"} + for: 1m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster + - alert: CNPGClusterZoneSpreadWarning + annotations: + summary: CNPG Cluster instances in the same zone. + description: |- + CloudNativePG Cluster "immich/immich-postgresql-18-cluster" has instances in the same availability zone. + + A disaster in one availability zone will lead to a potential service disruption and/or data loss. 
+ runbook_url: https://github.com/cloudnative-pg/charts/blob/main/charts/cluster/docs/runbooks/CNPGClusterZoneSpreadWarning.md + expr: | + 3 > count(count by (label_topology_kubernetes_io_zone) (kube_pod_info{namespace="immich", pod=~"immich-postgresql-18-cluster-([1-9][0-9]*)$"} * on(node,instance) group_left(label_topology_kubernetes_io_zone) kube_node_labels)) < 3 + for: 5m + labels: + severity: warning + namespace: immich + cnpg_cluster: immich-postgresql-18-cluster diff --git a/clusters/cl01tl/manifests/immich/PrometheusRule-immich-valkey.yaml b/clusters/cl01tl/manifests/immich/PrometheusRule-immich-valkey.yaml new file mode 100644 index 000000000..bc042f70f --- /dev/null +++ b/clusters/cl01tl/manifests/immich/PrometheusRule-immich-valkey.yaml @@ -0,0 +1,47 @@ +apiVersion: monitoring.coreos.com/v1 +kind: PrometheusRule +metadata: + name: immich-valkey + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/part-of: valkey +spec: + groups: + - name: immich-valkey + rules: + - alert: ValkeyDown + annotations: + description: Valkey instance {{ $labels.instance }} is down. + summary: Valkey instance {{ $labels.instance }} down + expr: | + redis_up{service="immich-valkey-metrics"} == 0 + for: 2m + labels: + severity: error + - alert: ValkeyMemoryHigh + annotations: + description: | + Valkey instance {{ $labels.instance }} is using {{ $value }}% of its available memory. + summary: Valkey instance {{ $labels.instance }} is using too much memory + expr: | + redis_memory_used_bytes{service="immich-valkey-metrics"} * 100 + / + redis_memory_max_bytes{service="immich-valkey-metrics"} + > 90 <= 100 + for: 2m + labels: + severity: error + - alert: ValkeyKeyEviction + annotations: + description: | + Valkey instance {{ $labels.instance }} has evicted {{ $value }} keys in the last 5 minutes. 
+ summary: Valkey instance {{ $labels.instance }} has evicted keys + expr: | + increase(redis_evicted_keys_total{service="immich-valkey-metrics"}[5m]) > 0 + for: 1s + labels: + severity: error diff --git a/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-external.yaml b/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-external.yaml new file mode 100644 index 000000000..6de3c1df5 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-external.yaml @@ -0,0 +1,29 @@ +apiVersion: volsync.backube/v1alpha1 +kind: ReplicationSource +metadata: + name: immich-backup-source-external + namespace: immich + labels: + helm.sh/chart: volsync-target-data-1.1.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "1.1.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-backup +spec: + sourcePVC: immich + trigger: + schedule: 24 10 * * * + restic: + pruneIntervalDays: 7 + repository: immich-backup-secret-external + retain: + daily: 7 + hourly: 0 + monthly: 3 + weekly: 4 + yearly: 1 + copyMethod: Snapshot + storageClassName: ceph-block + volumeSnapshotClassName: ceph-blockpool-snapshot + cacheCapacity: 10Gi diff --git a/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-local.yaml b/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-local.yaml new file mode 100644 index 000000000..248145b53 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-local.yaml @@ -0,0 +1,29 @@ +apiVersion: volsync.backube/v1alpha1 +kind: ReplicationSource +metadata: + name: immich-backup-source-local + namespace: immich + labels: + helm.sh/chart: volsync-target-data-1.1.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "1.1.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-backup-source-local +spec: + 
sourcePVC: immich + trigger: + schedule: 24 8 * * * + restic: + pruneIntervalDays: 7 + repository: immich-backup-secret-local + retain: + daily: 7 + hourly: 0 + monthly: 3 + weekly: 4 + yearly: 1 + copyMethod: Snapshot + storageClassName: ceph-block + volumeSnapshotClassName: ceph-blockpool-snapshot + cacheCapacity: 10Gi diff --git a/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-remote.yaml b/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-remote.yaml new file mode 100644 index 000000000..970c20e74 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ReplicationSource-immich-backup-source-remote.yaml @@ -0,0 +1,29 @@ +apiVersion: volsync.backube/v1alpha1 +kind: ReplicationSource +metadata: + name: immich-backup-source-remote + namespace: immich + labels: + helm.sh/chart: volsync-target-data-1.1.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "1.1.1" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich-backup +spec: + sourcePVC: immich + trigger: + schedule: 24 9 * * * + restic: + pruneIntervalDays: 7 + repository: immich-backup-secret-remote + retain: + daily: 7 + hourly: 0 + monthly: 3 + weekly: 4 + yearly: 1 + copyMethod: Snapshot + storageClassName: ceph-block + volumeSnapshotClassName: ceph-blockpool-snapshot + cacheCapacity: 10Gi diff --git a/clusters/cl01tl/manifests/immich/ScheduledBackup-immich-postgresql-18-scheduled-backup-live-backup.yaml b/clusters/cl01tl/manifests/immich/ScheduledBackup-immich-postgresql-18-scheduled-backup-live-backup.yaml new file mode 100644 index 000000000..6f18a8a5b --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ScheduledBackup-immich-postgresql-18-scheduled-backup-live-backup.yaml @@ -0,0 +1,24 @@ +apiVersion: postgresql.cnpg.io/v1 +kind: ScheduledBackup +metadata: + name: "immich-postgresql-18-scheduled-backup-live-backup" + namespace: immich + labels: + app.kubernetes.io/name: 
"immich-postgresql-18-scheduled-backup-live-backup" + helm.sh/chart: postgres-18-cluster-7.12.1 + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich + app.kubernetes.io/version: "7.12.1" + app.kubernetes.io/managed-by: Helm +spec: + immediate: true + suspend: false + schedule: "0 40 14 * * *" + backupOwnerReference: self + cluster: + name: immich-postgresql-18-cluster + method: plugin + pluginConfiguration: + name: barman-cloud.cloudnative-pg.io + parameters: + barmanObjectName: "immich-postgresql-18-backup-garage-local" diff --git a/clusters/cl01tl/manifests/immich/Secret-immich-immich-sa-token.yaml b/clusters/cl01tl/manifests/immich/Secret-immich-immich-sa-token.yaml new file mode 100644 index 000000000..2628b39fd --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Secret-immich-immich-sa-token.yaml @@ -0,0 +1,13 @@ +apiVersion: v1 +kind: Secret +type: kubernetes.io/service-account-token +metadata: + name: immich-immich-sa-token + labels: + app.kubernetes.io/instance: immich + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich + helm.sh/chart: immich-4.6.2 + annotations: + kubernetes.io/service-account.name: immich + namespace: immich diff --git a/clusters/cl01tl/manifests/immich/SecretProviderClass-immich-config.yaml b/clusters/cl01tl/manifests/immich/SecretProviderClass-immich-config.yaml new file mode 100644 index 000000000..d1c78ea57 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/SecretProviderClass-immich-config.yaml @@ -0,0 +1,19 @@ +apiVersion: secrets-store.csi.x-k8s.io/v1 +kind: SecretProviderClass +metadata: + name: immich-config + namespace: immich + labels: + app.kubernetes.io/name: immich-config + app.kubernetes.io/instance: immich + app.kubernetes.io/part-of: immich +spec: + provider: openbao + parameters: + baoAddress: "http://openbao-internal.openbao:8200" + roleName: immich + objects: | + - objectName: immich.json + fileName: immich.json + secretPath: secret/data/cl01tl/immich/config + secretKey: 
immich.json diff --git a/clusters/cl01tl/manifests/immich/Service-immich-valkey-headless.yaml b/clusters/cl01tl/manifests/immich/Service-immich-valkey-headless.yaml new file mode 100644 index 000000000..1b5dcb00a --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Service-immich-valkey-headless.yaml @@ -0,0 +1,23 @@ +apiVersion: v1 +kind: Service +metadata: + name: immich-valkey-headless + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/component: headless +spec: + type: ClusterIP + clusterIP: None + publishNotReadyAddresses: true + ports: + - name: tcp + port: 6379 + targetPort: tcp + protocol: TCP + selector: + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich diff --git a/clusters/cl01tl/manifests/immich/Service-immich-valkey-metrics.yaml b/clusters/cl01tl/manifests/immich/Service-immich-valkey-metrics.yaml new file mode 100644 index 000000000..ff6de0460 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Service-immich-valkey-metrics.yaml @@ -0,0 +1,23 @@ +apiVersion: v1 +kind: Service +metadata: + name: immich-valkey-metrics + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/component: metrics + app.kubernetes.io/part-of: valkey + annotations: +spec: + type: ClusterIP + ports: + - name: metrics + port: 9121 + protocol: TCP + targetPort: metrics + selector: + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich diff --git a/clusters/cl01tl/manifests/immich/Service-immich-valkey-read.yaml b/clusters/cl01tl/manifests/immich/Service-immich-valkey-read.yaml new file mode 100644 index 000000000..e91c2856b --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Service-immich-valkey-read.yaml @@ -0,0 +1,21 @@ +apiVersion: v1 +kind: 
Service +metadata: + name: immich-valkey-read + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/component: read +spec: + type: ClusterIP + ports: + - name: tcp + port: 6379 + targetPort: tcp + protocol: TCP + selector: + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich diff --git a/clusters/cl01tl/manifests/immich/Service-immich-valkey.yaml b/clusters/cl01tl/manifests/immich/Service-immich-valkey.yaml new file mode 100644 index 000000000..1f4852319 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Service-immich-valkey.yaml @@ -0,0 +1,22 @@ +apiVersion: v1 +kind: Service +metadata: + name: immich-valkey + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/component: primary +spec: + type: ClusterIP + ports: + - port: 6379 + targetPort: tcp + protocol: TCP + name: tcp + selector: + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + statefulset.kubernetes.io/pod-name: immich-valkey-0 diff --git a/clusters/cl01tl/manifests/immich/Service-immich.yaml b/clusters/cl01tl/manifests/immich/Service-immich.yaml new file mode 100644 index 000000000..fb0158a83 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/Service-immich.yaml @@ -0,0 +1,30 @@ +apiVersion: v1 +kind: Service +metadata: + name: immich + labels: + app.kubernetes.io/instance: immich + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich + app.kubernetes.io/service: immich + helm.sh/chart: immich-4.6.2 + namespace: immich +spec: + type: ClusterIP + ports: + - port: 2283 + targetPort: 2283 + protocol: TCP + name: http + - port: 8081 + targetPort: 8081 + protocol: TCP + name: metrics-api + - port: 8082 + targetPort: 8082 + protocol: TCP + name: metrics-ms + 
selector: + app.kubernetes.io/controller: main + app.kubernetes.io/instance: immich + app.kubernetes.io/name: immich diff --git a/clusters/cl01tl/manifests/immich/ServiceAccount-immich-valkey.yaml b/clusters/cl01tl/manifests/immich/ServiceAccount-immich-valkey.yaml new file mode 100644 index 000000000..d1e7d95df --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ServiceAccount-immich-valkey.yaml @@ -0,0 +1,11 @@ +apiVersion: v1 +kind: ServiceAccount +metadata: + name: immich-valkey + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm +automountServiceAccountToken: false diff --git a/clusters/cl01tl/manifests/immich/ServiceAccount-immich.yaml b/clusters/cl01tl/manifests/immich/ServiceAccount-immich.yaml new file mode 100644 index 000000000..4c94fbe57 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ServiceAccount-immich.yaml @@ -0,0 +1,12 @@ +apiVersion: v1 +kind: ServiceAccount +metadata: + name: immich + labels: + app.kubernetes.io/instance: immich + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich + helm.sh/chart: immich-4.6.2 + namespace: immich +secrets: + - name: immich-immich-sa-token diff --git a/clusters/cl01tl/manifests/immich/ServiceMonitor-immich-valkey.yaml b/clusters/cl01tl/manifests/immich/ServiceMonitor-immich-valkey.yaml new file mode 100644 index 000000000..631397d43 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ServiceMonitor-immich-valkey.yaml @@ -0,0 +1,24 @@ +apiVersion: monitoring.coreos.com/v1 +kind: ServiceMonitor +metadata: + name: immich-valkey + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/part-of: valkey + app.kubernetes.io/component: service-monitor +spec: + endpoints: + - port: metrics + interval: 30s + namespaceSelector: 
+ matchNames: + - immich + selector: + matchLabels: + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/component: metrics diff --git a/clusters/cl01tl/manifests/immich/ServiceMonitor-immich.yaml b/clusters/cl01tl/manifests/immich/ServiceMonitor-immich.yaml new file mode 100644 index 000000000..2e4deea17 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/ServiceMonitor-immich.yaml @@ -0,0 +1,28 @@ +apiVersion: monitoring.coreos.com/v1 +kind: ServiceMonitor +metadata: + name: immich + labels: + app.kubernetes.io/instance: immich + app.kubernetes.io/managed-by: Helm + app.kubernetes.io/name: immich + helm.sh/chart: immich-4.6.2 + namespace: immich +spec: + jobLabel: immich + namespaceSelector: + matchNames: + - immich + selector: + matchLabels: + app.kubernetes.io/instance: immich + app.kubernetes.io/name: immich + endpoints: + - interval: 3m + path: /metrics + port: metrics-api + scrapeTimeout: 1m + - interval: 3m + path: /metrics + port: metrics-ms + scrapeTimeout: 1m diff --git a/clusters/cl01tl/manifests/immich/StatefulSet-immich-valkey.yaml b/clusters/cl01tl/manifests/immich/StatefulSet-immich-valkey.yaml new file mode 100644 index 000000000..993c7cda2 --- /dev/null +++ b/clusters/cl01tl/manifests/immich/StatefulSet-immich-valkey.yaml @@ -0,0 +1,133 @@ +apiVersion: apps/v1 +kind: StatefulSet +metadata: + name: immich-valkey + labels: + helm.sh/chart: valkey-0.9.4 + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + app.kubernetes.io/version: "9.0.3" + app.kubernetes.io/managed-by: Helm +spec: + serviceName: immich-valkey-headless + replicas: 3 + podManagementPolicy: OrderedReady + selector: + matchLabels: + app.kubernetes.io/name: valkey + app.kubernetes.io/instance: immich + volumeClaimTemplates: + - metadata: + name: valkey-data + spec: + accessModes: + - ReadWriteOnce + storageClassName: "ceph-block" + resources: + requests: + storage: "1Gi" + template: + metadata: + labels: + app.kubernetes.io/name: 
valkey + app.kubernetes.io/instance: immich + annotations: + checksum/initconfig: "2d8432be19db9efa32b993becf4e58d4" + spec: + automountServiceAccountToken: false + serviceAccountName: immich-valkey + securityContext: + fsGroup: 1000 + runAsGroup: 1000 + runAsUser: 1000 + seccompProfile: + type: RuntimeDefault + initContainers: + - name: immich-valkey-init + image: docker.io/valkey/valkey:9.0.3@sha256:3b55fbaa0cd93cf0d9d961f405e4dfcc70efe325e2d84da207a0a8e6d8fde4f9 + imagePullPolicy: IfNotPresent + securityContext: + allowPrivilegeEscalation: false + capabilities: + drop: + - ALL + readOnlyRootFilesystem: true + runAsNonRoot: true + runAsUser: 1000 + command: ["/scripts/init.sh"] + env: + - name: POD_INDEX + valueFrom: + fieldRef: + fieldPath: metadata.labels['apps.kubernetes.io/pod-index'] + volumeMounts: + - name: valkey-data + mountPath: /data + - name: scripts + mountPath: /scripts + containers: + - name: immich-valkey + image: docker.io/valkey/valkey:9.0.3@sha256:3b55fbaa0cd93cf0d9d961f405e4dfcc70efe325e2d84da207a0a8e6d8fde4f9 + imagePullPolicy: IfNotPresent + command: ["valkey-server"] + args: ["/data/conf/valkey.conf"] + securityContext: + allowPrivilegeEscalation: false + capabilities: + drop: + - ALL + readOnlyRootFilesystem: true + runAsNonRoot: true + runAsUser: 1000 + env: + - name: POD_INDEX + valueFrom: + fieldRef: + fieldPath: metadata.labels['apps.kubernetes.io/pod-index'] + - name: VALKEY_LOGLEVEL + value: "notice" + ports: + - name: tcp + containerPort: 6379 + protocol: TCP + startupProbe: + exec: + command: ["sh", "-c", "valkey-cli ping"] + livenessProbe: + exec: + command: ["sh", "-c", "valkey-cli ping"] + resources: + requests: + cpu: 10m + memory: 20Mi + volumeMounts: + - name: valkey-data + mountPath: /data + - name: metrics + image: ghcr.io/oliver006/redis_exporter:v1.83.0@sha256:e8c209894d4c0cc55b1259ddd47e0b769ad1ff864b356736ee885462a3b0e48c + imagePullPolicy: "IfNotPresent" + ports: + - name: metrics + containerPort: 9121 + startupProbe: 
+ tcpSocket: + port: metrics + livenessProbe: + tcpSocket: + port: metrics + readinessProbe: + httpGet: + path: / + port: metrics + resources: + requests: + cpu: 1m + memory: 10M + env: + - name: REDIS_ALIAS + value: immich-valkey + volumes: + - name: scripts + configMap: + name: immich-valkey-init-scripts + defaultMode: 0555