feat: Enhance telemetry services with Kubernetes cluster auto-discovery and health check configuration

This commit is contained in:
Nawaz Dhandala
2026-03-18 11:20:13 +00:00
parent 4cba330605
commit e4a76117b1
7 changed files with 244 additions and 40 deletions

View File

@@ -8,6 +8,10 @@ metadata:
{{- include "kubernetes-agent.labels" . | nindent 4 }}
data:
otel-collector-config.yaml: |
+ extensions:
+ health_check:
+ endpoint: "0.0.0.0:13133"
receivers:
# Collect pod logs from /var/log/pods
filelog:
@@ -115,11 +119,13 @@ data:
exporters:
otlphttp:
- endpoint: "{{ .Values.oneuptime.url }}"
+ endpoint: "{{ .Values.oneuptime.url }}/otlp"
headers:
x-oneuptime-token: "${env:ONEUPTIME_API_KEY}"
service:
+ extensions:
+ - health_check
pipelines:
logs:
receivers:

View File

@@ -7,6 +7,10 @@ metadata:
{{- include "kubernetes-agent.labels" . | nindent 4 }}
data:
otel-collector-config.yaml: |
+ extensions:
+ health_check:
+ endpoint: "0.0.0.0:13133"
receivers:
# Collect node, pod, and container resource metrics from kubelet
kubeletstats:
@@ -133,22 +137,25 @@ data:
# Batch telemetry for efficient export
batch:
- send_batch_size: 1024
+ send_batch_size: 200
+ send_batch_max_size: 500
timeout: 10s
# Limit memory usage
memory_limiter:
check_interval: 5s
- limit_mib: 400
- spike_limit_mib: 100
+ limit_mib: 1500
+ spike_limit_mib: 300
exporters:
otlphttp:
- endpoint: "{{ .Values.oneuptime.url }}"
+ endpoint: "{{ .Values.oneuptime.url }}/otlp"
headers:
x-oneuptime-token: "${env:ONEUPTIME_API_KEY}"
service:
+ extensions:
+ - health_check
pipelines:
metrics:
receivers:

View File

@@ -29,11 +29,11 @@ deployment:
replicas: 1
resources:
requests:
- cpu: 100m
- memory: 256Mi
- limits:
- cpu: 500m
+ cpu: 200m
  memory: 512Mi
+ limits:
+ cpu: 1000m
+ memory: 2Gi
# Control plane monitoring (etcd, API server, scheduler, controller manager)
# Disabled by default — enable for self-managed clusters.