diff --git a/CHANGES.md b/CHANGES.md index 46faa2a4c..e2cb82c1e 100644 --- a/CHANGES.md +++ b/CHANGES.md @@ -10,6 +10,9 @@ Notable changes between versions. #### Addons * Raise nginx-ingress liveness/readiness timeout to 5 seconds +* Improve Prometheus metrics labels and drop extraneous metrics ([#397](https://github.com/poseidon/typhoon/pull/397)) + * Add `pod` name label to metrics discovered via service endpoints + * Rename `kubernetes_namespace` label to `namespace` ## v1.13.3 diff --git a/addons/prometheus/config.yaml b/addons/prometheus/config.yaml index b1d383071..3ea5b65dd 100644 --- a/addons/prometheus/config.yaml +++ b/addons/prometheus/config.yaml @@ -55,6 +55,17 @@ data: action: replace target_label: job + metric_relabel_configs: + - source_labels: [__name__] + action: drop + regex: etcd_(debugging|disk|request|server).* + - source_labels: [__name__] + action: drop + regex: apiserver_admission_controller_admission_latencies_seconds_.* + - source_labels: [__name__] + action: drop + regex: apiserver_admission_step_admission_latencies_seconds_.* + # Scrape config for node (i.e. kubelet) /metrics (e.g. 'kubelet_'). Explore # metrics from a node by scraping kubelet (127.0.0.1:10250/metrics). - job_name: 'kubelet' @@ -89,6 +100,13 @@ data: relabel_configs: - action: labelmap regex: __meta_kubernetes_node_label_(.+) + metric_relabel_configs: + - source_labels: [__name__, image] + action: drop + regex: container_([a-z_]+); + - source_labels: [__name__] + action: drop + regex: container_(network_tcp_usage_total|network_udp_usage_total|tasks_state|cpu_load_average_10s) # Scrap etcd metrics from controllers via listen-metrics-urls @@ -119,10 +137,10 @@ data: # * `prometheus.io/port`: If the metrics are exposed on a different port to the # service then set this appropriately. - job_name: 'kubernetes-service-endpoints' - kubernetes_sd_configs: - role: endpoints + honor_labels: true relabel_configs: - source_labels: [__meta_kubernetes_service_annotation_prometheus_io_scrape] action: keep @@ -144,10 +162,18 @@ data: regex: __meta_kubernetes_service_label_(.+) - source_labels: [__meta_kubernetes_namespace] action: replace - target_label: kubernetes_namespace + target_label: namespace + - source_labels: [__meta_kubernetes_pod_name] + action: replace + target_label: pod - source_labels: [__meta_kubernetes_service_name] action: replace target_label: job + + metric_relabel_configs: + - source_labels: [__name__] + action: drop + regex: etcd_(debugging|disk|request|server).* # Example scrape config for probing services via the Blackbox Exporter. # @@ -177,7 +203,7 @@ data: - action: labelmap regex: __meta_kubernetes_service_label_(.+) - source_labels: [__meta_kubernetes_namespace] - target_label: kubernetes_namespace + target_label: namespace - source_labels: [__meta_kubernetes_service_name] target_label: job