PERF(observability): remove CPU limits for stability

- Remove CPU limits from all observability components
- Prevent CPU throttling across the monitoring stack
This commit is contained in:
2026-01-12 02:10:54 +09:00
parent 3b5bf20902
commit 7e61af372b
13 changed files with 2642 additions and 26 deletions

View File

@@ -21,13 +21,12 @@ affinity:
persistence:
enabled: false
-# Resource settings (VPA lowerBound/target)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 100Mi
# Disable default config - use secret instead

View File

@@ -5,13 +5,12 @@ fullnameOverride: blackbox-exporter
replicas: 1
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 32m
memory: 100Mi
config:

View File

@@ -6,13 +6,12 @@ dashboard:
enabled: true
replicaCount: 1
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 100Mi
service:
@@ -51,13 +50,12 @@ controller:
enabled: true
replicaCount: 1
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 25m
memory: 100Mi
# Enable VPA recommendations for all namespaces

2629
grafana/dashboards/APM.json Normal file

File diff suppressed because it is too large Load Diff

View File

@@ -39,13 +39,12 @@ podSecurityContext:
fsGroup: 472
fsGroupChangePolicy: "Always"
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 22m
memory: 144Mi
limits:
-cpu: 24m
memory: 242Mi
service:

View File

@@ -7,13 +7,12 @@ fullnameOverride: kube-state-metrics
# Note: kube-state-metrics는 stateless이지만, 여러 replica는 동일한 메트릭을 중복 생성하므로
# 단일 replica로 실행하는 것이 권장됩니다.
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 100Mi
service:

View File

@@ -60,13 +60,12 @@ singleBinary:
mountPath: /var/loki
# Medium priority for observability
priorityClassName: medium-priority
-# Resource settings (VPA lowerBound/target)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 10m
memory: 225Mi
limits:
-cpu: 69m
memory: 323Mi
# Disable components not needed in single binary mode

View File

@@ -6,13 +6,12 @@ fullnameOverride: node-exporter
hostNetwork: true
hostPID: true
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 100Mi
service:

View File

@@ -28,14 +28,13 @@ image:
mode: daemonset
# =============================================================================
-# Resource Limits (VPA lowerBound/upperBound, mem limit capped at 1024Mi)
+# Resource Limits (no CPU limit for stability, mem limit capped at 1024Mi)
# =============================================================================
resources:
requests:
cpu: 34m
memory: 142Mi
limits:
-cpu: 410m
memory: 1024Mi
# =============================================================================

View File

@@ -14,13 +14,12 @@ prometheusOperator:
enabled: true
# CRD 생성 비활성화
createCustomResource: false
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 100Mi
# Kubelet ServiceMonitor with cluster label

View File

@@ -17,13 +17,12 @@ replicas: 1
# Tempo Configuration
# =============================================================================
tempo:
-# Resource settings (VPA lowerBound/target)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 109Mi
# Receivers - protocols Tempo accepts
receivers:

View File

@@ -46,13 +46,12 @@ query:
- --query.replica-label=prometheus_replica
- --query.auto-downsampling
-# Resource settings (VPA lowerBound/target)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 126Mi
# =============================================================================

View File

@@ -6,13 +6,12 @@ recommender:
enabled: true
replicaCount: 1
-# Resource settings (VPA lowerBound/upperBound)
+# Resource settings (no CPU limit for stability)
resources:
requests:
cpu: 15m
memory: 100Mi
limits:
-cpu: 15m
memory: 100Mi
# Updater - applies recommended resource requests to pods