PERF(resources): remove CPU limits - keep memory limits only

- CPU throttling prevents app startup, not crashes
- Memory exhaustion (OOM) is the real cause of cascading failures
- CPU requests still ensure fair scheduling
This commit is contained in:
2026-01-07 23:48:35 +09:00
parent 69dc3b34be
commit 4286296591
10 changed files with 42 additions and 33 deletions

View File

@@ -10,8 +10,10 @@ persistence:
resources: resources:
requests: requests:
cpu: 10m cpu: 15m
memory: 32Mi memory: 100Mi
limits:
memory: 150Mi
# Disable default config - use secret instead # Disable default config - use secret instead
config: config:

View File

@@ -7,12 +7,11 @@ dashboard:
replicaCount: 1 replicaCount: 1
resources: resources:
limits:
cpu: null
memory: 256Mi
requests: requests:
cpu: 25m cpu: 15m
memory: 128Mi memory: 100Mi
limits:
memory: 150Mi
service: service:
type: ClusterIP type: ClusterIP
@@ -39,12 +38,11 @@ controller:
enabled: true enabled: true
resources: resources:
limits:
cpu: null
memory: 256Mi
requests: requests:
cpu: 25m cpu: 15m
memory: 128Mi memory: 100Mi
limits:
memory: 150Mi
# Enable VPA recommendations for all namespaces # Enable VPA recommendations for all namespaces
# Set to false to only monitor namespaces with the label: goldilocks.fairwinds.com/enabled=true # Set to false to only monitor namespaces with the label: goldilocks.fairwinds.com/enabled=true

View File

@@ -24,8 +24,10 @@ podSecurityContext:
resources: resources:
requests: requests:
cpu: 25m cpu: 11m
memory: 128Mi memory: 425Mi
limits:
memory: 425Mi
service: service:
type: ClusterIP type: ClusterIP

View File

@@ -5,8 +5,10 @@ fullnameOverride: kube-state-metrics
resources: resources:
requests: requests:
cpu: 10m cpu: 15m
memory: 64Mi memory: 100Mi
limits:
memory: 150Mi
service: service:
type: ClusterIP type: ClusterIP

View File

@@ -43,8 +43,10 @@ singleBinary:
storageClass: local-path storageClass: local-path
resources: resources:
requests: requests:
cpu: 15m # Reduced from 50m based on actual usage (10m) cpu: 23m
memory: 128Mi memory: 462Mi
limits:
memory: 462Mi
# Disable components not needed in single binary mode # Disable components not needed in single binary mode
backend: backend:

View File

@@ -8,8 +8,10 @@ hostPID: true
resources: resources:
requests: requests:
cpu: 10m cpu: 15m
memory: 50Mi memory: 64Mi
limits:
memory: 96Mi
service: service:
type: ClusterIP type: ClusterIP

View File

@@ -53,11 +53,11 @@ prometheus:
storage: 5Gi storage: 5Gi
resources: resources:
limits:
memory: 1Gi # limit 추가 (무제한 증가 방지)
requests: requests:
cpu: 200m cpu: 200m
memory: 512Mi # 256Mi → 512Mi (실제 사용량 반영) memory: 512Mi
limits:
memory: 768Mi
# ServiceMonitor 자동 발견 - 모든 ServiceMonitor 선택 # ServiceMonitor 자동 발견 - 모든 ServiceMonitor 선택
serviceMonitorSelectorNilUsesHelmValues: false serviceMonitorSelectorNilUsesHelmValues: false

View File

@@ -32,8 +32,10 @@ defaultVolumeMounts:
# Resources # Resources
resources: resources:
requests: requests:
cpu: 25m # Reduced from 50m based on actual usage (8-17m) cpu: 23m
memory: 64Mi memory: 182Mi
limits:
memory: 182Mi
# Tolerations to run on all nodes including master # Tolerations to run on all nodes including master
tolerations: tolerations:

View File

@@ -13,10 +13,10 @@ persistence:
resources: resources:
requests: requests:
cpu: 50m cpu: 15m
memory: 128Mi memory: 200Mi
limits: limits:
memory: 256Mi memory: 300Mi
livenessProbe: livenessProbe:
enabled: true enabled: true

View File

@@ -7,12 +7,11 @@ recommender:
replicaCount: 1 replicaCount: 1
resources: resources:
limits:
cpu: null
memory: 1Gi
requests: requests:
cpu: 50m cpu: 15m
memory: 512Mi memory: 128Mi
limits:
memory: 192Mi
# Updater - applies recommended resource requests to pods # Updater - applies recommended resource requests to pods
# Disabled because we're using updateMode: Off (recommendations only) # Disabled because we're using updateMode: Off (recommendations only)