---
# yaml-language-server: $schema=https://ks.hsn.dev/helm.toolkit.fluxcd.io/helmrelease_v2beta2.json
# Flux HelmRelease for the kube-prometheus-stack chart.
apiVersion: helm.toolkit.fluxcd.io/v2beta2
kind: HelmRelease
metadata:
  name: kube-prometheus-stack
spec:
  interval: 30m
  timeout: 15m
  chart:
    spec:
      chart: kube-prometheus-stack
      version: 58.5.3
      sourceRef:
        kind: HelmRepository
        name: prometheus-community
        namespace: flux-system
  install:
    crds: CreateReplace
    remediation:
      retries: 3
  upgrade:
    cleanupOnFail: true
    crds: CreateReplace
    remediation:
      strategy: rollback
      retries: 3
  values:
    crds:
      enabled: true
    cleanPrometheusOperatorObjectNames: true
    alertmanager:
      ingress:
        enabled: true
        pathType: Prefix
        ingressClassName: internal-nginx
        hosts:
          # Anchor is reused for the TLS host entry directly below.
          - &host alertmanager.jahanson.tech
        tls:
          - hosts:
              - *host
      alertmanagerSpec:
        replicas: 1
        useExistingSecret: true
        configSecret: alertmanager-secret
        storage:
          volumeClaimTemplate:
            spec:
              storageClassName: openebs-zfs
              resources:
                requests:
                  storage: 1Gi
    kubelet:
      enabled: true
      serviceMonitor:
        metricRelabelings:
          # Drop high cardinality labels
          - action: labeldrop
            regex: (uid)
          - action: labeldrop
            regex: (id|name)
          - action: drop
            sourceLabels: ["__name__"]
            regex: (rest_client_request_duration_seconds_bucket|rest_client_request_duration_seconds_sum|rest_client_request_duration_seconds_count)
    kubeApiServer:
      enabled: true
      serviceMonitor:
        metricRelabelings:
          # Drop high cardinality labels
          - action: drop
            sourceLabels: ["__name__"]
            regex: (apiserver|etcd|rest_client)_request(|_sli|_slo)_duration_seconds_bucket
          - action: drop
            sourceLabels: ["__name__"]
            regex: (apiserver_response_sizes_bucket|apiserver_watch_events_sizes_bucket)
    kubeControllerManager:
      enabled: true
      # Endpoint list is anchored here and aliased by kubeEtcd and
      # kubeScheduler below.
      endpoints: &cp
        - 10.1.1.61
    kubeEtcd:
      enabled: true
      endpoints: *cp
    kubeScheduler:
      enabled: true
      endpoints: *cp
    kubeProxy:
      enabled: false
    prometheus:
      ingress:
        enabled: true
        ingressClassName: internal-nginx
        pathType: Prefix
        hosts:
          # Re-binds the `host` anchor; the alias below resolves to this
          # value, not the Alertmanager host defined earlier.
          - &host prometheus.jahanson.tech
        tls:
          - hosts:
              - *host
      thanosService:
        enabled: true
      thanosServiceMonitor:
        enabled: true
      # thanosServiceExternal:
      #   enabled: true
      #   type: LoadBalancer
      #   annotations:
      #     external-dns.alpha.kubernetes.io/hostname: thanos.jahanson.tech
      #     io.cilium/lb-ipam-ips: 10.45.0.6
      #   externalTrafficPolicy: Cluster
      prometheusSpec:
        podMetadata:
          annotations:
            # Anchored secret name is aliased by
            # thanos.objectStorageConfig.existingSecret.name below.
            secret.reloader.stakater.com/reload: &secret thanos-objstore-config
        replicas: 1
        replicaExternalLabelName: __replica__
        scrapeInterval: 1m # Must match interval in Grafana Helm chart
        ruleSelectorNilUsesHelmValues: false
        serviceMonitorSelectorNilUsesHelmValues: false
        podMonitorSelectorNilUsesHelmValues: false
        probeSelectorNilUsesHelmValues: false
        scrapeConfigSelectorNilUsesHelmValues: false
        enableAdminAPI: true
        walCompression: true
        enableFeatures:
          - auto-gomemlimit
          - memory-snapshot-on-shutdown
          - new-service-discovery-manager
        image:
          registry: quay.io
          repository: prometheus/prometheus
          tag: v2.51.0-dedupelabels
        thanos:
          # NOTE(review): ${THANOS_VERSION} is not defined in this file;
          # presumably filled in by Flux post-build substitution - confirm.
          image: quay.io/thanos/thanos:${THANOS_VERSION}
          version: "${THANOS_VERSION#v}"
          objectStorageConfig:
            existingSecret:
              name: *secret
              key: config
        retention: 2d
        retentionSize: 15GB
        externalLabels:
          cluster: main
        storageSpec:
          volumeClaimTemplate:
            spec:
              storageClassName: openebs-zfs
              resources:
                requests:
                  storage: 20Gi
    nodeExporter:
      enabled: true
    prometheus-node-exporter:
      fullnameOverride: node-exporter
      prometheus:
        monitor:
          enabled: true
          relabelings:
            # Copy the pod's node name into the `kubernetes_node` label.
            - action: replace
              regex: (.*)
              replacement: $1
              sourceLabels:
                - __meta_kubernetes_pod_node_name
              targetLabel: kubernetes_node
    kubeStateMetrics:
      enabled: true
    kube-state-metrics:
      fullnameOverride: kube-state-metrics
      metricLabelsAllowlist:
        - pods=[*]
        - deployments=[*]
        - persistentvolumeclaims=[*]
      prometheus:
        monitor:
          enabled: true
          relabelings:
            # Copy the pod's node name into the `kubernetes_node` label.
            - action: replace
              regex: (.*)
              replacement: $1
              sourceLabels:
                - __meta_kubernetes_pod_node_name
              targetLabel: kubernetes_node
    grafana:
      enabled: false
      forceDeployDashboards: true
      sidecar:
        dashboards:
          annotations:
            grafana_folder: Kubernetes
          multicluster:
            etcd:
              enabled: true