Compare commits

..

10 Commits

Author SHA1 Message Date
70b3491072 FIX(velero): increase velero-ui memory limit
- Increase memory from 128Mi to 256Mi
- Fix OOMKilled (exit code 137) issue
2026-01-10 19:00:18 +09:00
39ad7757f8 REFACTOR(repo): remove control-plane scheduling
- Remove nodeSelector for control-plane node
- Remove tolerations for control-plane taint
- Allow pods to schedule on any available node
2026-01-10 18:35:15 +09:00
ffbe97815b FEAT(minio): enable ServiceMonitor for Prometheus
- Add includeNode for per-node metrics
- Add release label for Prometheus discovery
- Set 30s interval and 10s timeout
2026-01-10 17:12:53 +09:00
e22f6211b0 FIX(minio): correct invalid SCANNER_SPEED value
- Change MINIO_SCANNER_SPEED from 'off' to 'slowest'
- 'off' is not a valid value, causing config errors
2026-01-10 17:08:21 +09:00
40e02a4ac4 PERF(velero): disable backup-sync to reduce MinIO load
- Set backupSyncPeriod to 0s
- User only uses manual backups
2026-01-10 17:02:15 +09:00
b4049151d6 PERF(minio): disable scanner to reduce CPU usage
- Change MINIO_SCANNER_SPEED from slow to off
- Velero backups provide data redundancy instead
2026-01-10 16:18:12 +09:00
485b588a7e PERF(storage): adjust resources based on VPA
- Update minio memory 263Mi→175Mi
- Update cnpg memory 128Mi→121Mi
- Update zot memory 128Mi→121Mi
- Update velero memory 128Mi→75Mi
- Update velero nodeAgent memory 256Mi→100Mi
2026-01-10 14:34:29 +09:00
f6a1b29425 PERF(cnpg): reduce operator replicas to 1
- Reduce CNPG operator replicas to 1
- PostgreSQL cluster (3 instances) unchanged
2026-01-10 13:31:58 +09:00
6b626b099a PERF(storage): reduce replicas to 1
- Reduce pgweb replicas from 2 to 1
- Reduce MinIO console replicas from 2 to 1
2026-01-10 13:15:56 +09:00
565b60a970 PERF(storage): add high-priority to MinIO and CNPG
- Remove MinIO tolerations (PreferNoSchedule handles it)
- Add high-priority to MinIO (4 replicas for erasure coding)
- Add high-priority to CNPG operator
2026-01-10 13:14:08 +09:00
8 changed files with 30 additions and 53 deletions

View File

@@ -8,15 +8,15 @@ image:
pullPolicy: IfNotPresent
# Replica count for operator
replicaCount: 2
replicaCount: 1
# Resource requests for operator
resources:
requests:
cpu: 15m
memory: 128Mi
memory: 121Mi
limits:
memory: 128Mi
memory: 121Mi
# RBAC
rbac:
@@ -67,6 +67,9 @@ nodeSelector: {}
# Tolerations
tolerations: []
# High priority for critical database operator
priorityClassName: high-priority
# Affinity - Soft Anti-Affinity to spread pods across nodes
affinity:
podAntiAffinity:

View File

@@ -35,10 +35,10 @@ rootPasswordSecretKey: root-password
# Resources
resources:
requests:
memory: 263Mi
memory: 175Mi
cpu: 15m
limits:
memory: 263Mi
memory: 175Mi
# Service
service:
@@ -58,7 +58,7 @@ environment:
MINIO_API_REPLICATION_MAX_WORKERS: "1"
MINIO_API_REPLICATION_MAX_LRG_WORKERS: "1"
MINIO_API_TRANSITION_WORKERS: "1"
MINIO_SCANNER_SPEED: "slow"
MINIO_SCANNER_SPEED: "slowest"
# API Ingress (S3 endpoint)
ingress:
@@ -101,16 +101,18 @@ affinity:
- minio
topologyKey: kubernetes.io/hostname
# Tolerations for control-plane node (minio-0 runs on control-plane)
tolerations:
- key: "node-role.kubernetes.io/control-plane"
operator: "Exists"
effect: "NoSchedule"
# High priority for critical storage infrastructure
priorityClassName: high-priority
# Prometheus metrics
metrics:
serviceMonitor:
enabled: true # Enable ServiceMonitor for Prometheus scraping
enabled: true
includeNode: true
additionalLabels:
release: prometheus
interval: 30s
scrapeTimeout: 10s
# Disable post-install job by setting all triggers to empty
# Job is created if any of: buckets, users, policies, customCommands, svcaccts exist

View File

@@ -6,7 +6,7 @@ metadata:
labels:
app: minio-console
spec:
replicas: 2
replicas: 1
selector:
matchLabels:
app: minio-console

View File

@@ -3,7 +3,7 @@
controllers:
main:
replicas: 2
replicas: 1
annotations:
reloader.stakater.com/auto: "true"
containers:

View File

@@ -67,10 +67,6 @@ spec:
# Affinity to spread replicas across nodes (soft - prefer different nodes)
affinity:
podAntiAffinityType: preferred
tolerations:
- key: "node-role.kubernetes.io/control-plane"
operator: "Exists"
effect: "NoSchedule"
# Enable superuser access
enableSuperuserAccess: true

View File

@@ -74,9 +74,9 @@ spec:
resources:
requests:
cpu: 15m # VPA recommendation
memory: 128Mi
memory: 256Mi
limits:
memory: 128Mi
memory: 256Mi
service:
type: ClusterIP
@@ -86,15 +86,6 @@ spec:
- name: BASIC_AUTH_ENABLED
value: "false"
# Run on master node with velero controller
nodeSelector:
node-role.kubernetes.io/control-plane: "true"
tolerations:
- key: "node-role.kubernetes.io/control-plane"
operator: "Exists"
effect: "NoSchedule"
affinity: {}
envFrom: []

View File

@@ -17,9 +17,9 @@ replicaCount: 1
resources:
requests:
cpu: 11m
memory: 128Mi
memory: 75Mi
limits:
memory: 128Mi
memory: 75Mi
# Init containers for plugins
initContainers:
@@ -39,16 +39,10 @@ nodeAgent:
privileged: false
resources:
requests:
cpu: 15m # VPA recommendation: 15m
memory: 256Mi
cpu: 15m
memory: 100Mi
limits:
memory: 256Mi
# Run on all nodes including control-plane for full backup coverage
tolerations:
- key: "node-role.kubernetes.io/control-plane"
operator: "Exists"
effect: "NoSchedule"
memory: 100Mi
# Configuration for backup storage
configuration:
# Use existing BackupStorageLocation and VolumeSnapshotLocation
@@ -81,7 +75,8 @@ configuration:
# This prevents status updates that trigger ArgoCD refreshes
storeValidationFrequency: 0s
# Note: backup-sync is enabled to show backups in velero-ui
# Disable backup-sync (user only uses manual backups)
backupSyncPeriod: 0s
# Credentials for S3 access (from Vault via External Secrets)
credentials:
@@ -106,15 +101,5 @@ serviceAccount:
rbac:
create: true
# Node selector - Run on control-plane node for stability
nodeSelector:
node-role.kubernetes.io/control-plane: "true"
# Tolerations - Allow scheduling on control-plane node
tolerations:
- key: "node-role.kubernetes.io/control-plane"
operator: "Exists"
effect: "NoSchedule"
# Affinity (disabled - single replica on master)
affinity: {}

View File

@@ -35,9 +35,9 @@ controllers:
resources:
requests:
cpu: 15m
memory: 128Mi
memory: 121Mi
limits:
memory: 128Mi
memory: 121Mi
service:
zot:
controller: zot