PERF(observability): remove CPU limits for stability

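- Remove CPU limits from all observability components (CPU requests and memory limits are unchanged)
- Prevent CPU throttling across the monitoring stack
- Add the Grafana APM dashboard (grafana/dashboards/APM.json)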
This commit is contained in:
2026-01-12 02:10:54 +09:00
parent 3b5bf20902
commit 7e61af372b
13 changed files with 2642 additions and 26 deletions

View File

@@ -21,13 +21,12 @@ affinity:
persistence: persistence:
enabled: false enabled: false
# Resource settings (VPA lowerBound/target) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 100Mi memory: 100Mi
# Disable default config - use secret instead # Disable default config - use secret instead

View File

@@ -5,13 +5,12 @@ fullnameOverride: blackbox-exporter
replicas: 1 replicas: 1
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 32m
memory: 100Mi memory: 100Mi
config: config:

View File

@@ -6,13 +6,12 @@ dashboard:
enabled: true enabled: true
replicaCount: 1 replicaCount: 1
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 100Mi memory: 100Mi
service: service:
@@ -51,13 +50,12 @@ controller:
enabled: true enabled: true
replicaCount: 1 replicaCount: 1
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 25m
memory: 100Mi memory: 100Mi
# Enable VPA recommendations for all namespaces # Enable VPA recommendations for all namespaces

2629
grafana/dashboards/APM.json Normal file

File diff suppressed because it is too large Load Diff

View File

@@ -39,13 +39,12 @@ podSecurityContext:
fsGroup: 472 fsGroup: 472
fsGroupChangePolicy: "Always" fsGroupChangePolicy: "Always"
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 22m cpu: 22m
memory: 144Mi memory: 144Mi
limits: limits:
cpu: 24m
memory: 242Mi memory: 242Mi
service: service:

View File

@@ -7,13 +7,12 @@ fullnameOverride: kube-state-metrics
# Note: kube-state-metrics는 stateless이지만, 여러 replica는 동일한 메트릭을 중복 생성하므로 # Note: kube-state-metrics는 stateless이지만, 여러 replica는 동일한 메트릭을 중복 생성하므로
# 단일 replica로 실행하는 것이 권장됩니다. # 단일 replica로 실행하는 것이 권장됩니다.
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 100Mi memory: 100Mi
service: service:

View File

@@ -60,13 +60,12 @@ singleBinary:
mountPath: /var/loki mountPath: /var/loki
# Medium priority for observability # Medium priority for observability
priorityClassName: medium-priority priorityClassName: medium-priority
# Resource settings (VPA lowerBound/target) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 10m cpu: 10m
memory: 225Mi memory: 225Mi
limits: limits:
cpu: 69m
memory: 323Mi memory: 323Mi
# Disable components not needed in single binary mode # Disable components not needed in single binary mode

View File

@@ -6,13 +6,12 @@ fullnameOverride: node-exporter
hostNetwork: true hostNetwork: true
hostPID: true hostPID: true
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 100Mi memory: 100Mi
service: service:

View File

@@ -28,14 +28,13 @@ image:
mode: daemonset mode: daemonset
# ============================================================================= # =============================================================================
# Resource Limits (VPA lowerBound/upperBound, mem limit capped at 1024Mi) # Resource Limits (no CPU limit for stability, mem limit capped at 1024Mi)
# ============================================================================= # =============================================================================
resources: resources:
requests: requests:
cpu: 34m cpu: 34m
memory: 142Mi memory: 142Mi
limits: limits:
cpu: 410m
memory: 1024Mi memory: 1024Mi
# ============================================================================= # =============================================================================

View File

@@ -14,13 +14,12 @@ prometheusOperator:
enabled: true enabled: true
# CRD 생성 비활성화 # CRD 생성 비활성화
createCustomResource: false createCustomResource: false
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 100Mi memory: 100Mi
# Kubelet ServiceMonitor with cluster label # Kubelet ServiceMonitor with cluster label

View File

@@ -17,13 +17,12 @@ replicas: 1
# Tempo Configuration # Tempo Configuration
# ============================================================================= # =============================================================================
tempo: tempo:
# Resource settings (VPA lowerBound/target) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 109Mi memory: 109Mi
# Receivers - protocols Tempo accepts # Receivers - protocols Tempo accepts
receivers: receivers:

View File

@@ -46,13 +46,12 @@ query:
- --query.replica-label=prometheus_replica - --query.replica-label=prometheus_replica
- --query.auto-downsampling - --query.auto-downsampling
# Resource settings (VPA lowerBound/target) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 126Mi memory: 126Mi
# ============================================================================= # =============================================================================

View File

@@ -6,13 +6,12 @@ recommender:
enabled: true enabled: true
replicaCount: 1 replicaCount: 1
# Resource settings (VPA lowerBound/upperBound) # Resource settings (no CPU limit for stability)
resources: resources:
requests: requests:
cpu: 15m cpu: 15m
memory: 100Mi memory: 100Mi
limits: limits:
cpu: 15m
memory: 100Mi memory: 100Mi
# Updater - applies recommended resource requests to pods # Updater - applies recommended resource requests to pods