diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 6d6d0776dc8b285e0457e7704b6cddb5b26ff8ca..ff0d7aeac902cd324093ef373418e6998e16333b 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -693,7 +693,7 @@ prometheus-alerts: RESOURCE: "kube-prometheus-stack" script: - *debug_information - - export BASIC_AUTH_PW=$(python3 -m stackspin $HOSTNAME secrets | grep stackspin-prometheus-basic-auth | cut -d'=' -f2) + - export BASIC_AUTH_PW=$(python3 -m stackspin $HOSTNAME secrets | grep stackspin-prometheus-basic-auth | awk '{ print $4 }') - cd test/ - bash ../.gitlab/ci_scripts/retry_cmd_until_success.sh 30 10 pytest -s -m prometheus extends: diff --git a/flux2/apps/monitoring/kube-prometheus-stack-values-configmap.yaml b/flux2/apps/monitoring/kube-prometheus-stack-values-configmap.yaml index f44583442f77494943f2c3b37f24c7447cd679d2..12d15a5ebef6c4db228877a6fca818fff7e7d5a8 100644 --- a/flux2/apps/monitoring/kube-prometheus-stack-values-configmap.yaml +++ b/flux2/apps/monitoring/kube-prometheus-stack-values-configmap.yaml @@ -13,11 +13,14 @@ data: kubeEtcd: enabled: false - # Disable kube-controller-manager and kube-scheduler monitoring. See https://github.com/cablespaghetti/k3s-monitoring/issues/2 + # Disable kube-controller-manager, kube-scheduler and kube-proxy monitoring. + # See https://github.com/cablespaghetti/k3s-monitoring/issues/2 kubeControllerManager: enabled: false kubeScheduler: enabled: false + kubeProxy: + enabled: false # https://github.com/prometheus-community/helm-charts/blob/main/charts/kube-prometheus-stack/values.yaml#L115 alertmanager: diff --git a/test/pytest/test_prometheus.py b/test/pytest/test_prometheus.py index 542bad0b09b9fdb1bdcb2b2df2f4946398a43db6..7e90f0d874a3d1bc72c4b247b4064bcd8a9545db 100755 --- a/test/pytest/test_prometheus.py +++ b/test/pytest/test_prometheus.py @@ -21,8 +21,7 @@ def ignore_alert(alert): return True # Ignore issues fom high load during installation phase - # KubeProxyDown: https://open.greenhost.net/stackspin/stackspin/-/issues/1105 - if re.search(r"(KubeAPIDown|KubeletDown|NodeFilesystemSpaceFillingUp|NodeClockNotSynchronising|KubeProxyDown)", + if re.search(r"(KubeAPIDown|KubeletDown|NodeFilesystemSpaceFillingUp|NodeClockNotSynchronising)", alert["labels"]["alertname"]): return True # Ignore nextcloud cron jobs (https://open.greenhost.net/stackspin/stackspin/-/issues/984)