Merge pull request #2387 from brancz/reduce-metrics

Reduce metrics
This commit is contained in:
Frederic Branczyk
2019-02-06 16:02:24 +01:00
committed by GitHub
5 changed files with 54 additions and 10 deletions

View File

@@ -282,6 +282,22 @@ local k = import 'ksonnet/ksonnet.beta.3/k.libsonnet';
insecureSkipVerify: true, insecureSkipVerify: true,
}, },
bearerTokenFile: '/var/run/secrets/kubernetes.io/serviceaccount/token', bearerTokenFile: '/var/run/secrets/kubernetes.io/serviceaccount/token',
metricRelabelings: [
// Drop container_* series whose `image` label is empty (the regex below matches "<name>;" with nothing after the separator).
{
sourceLabels: ['__name__', 'image'],
regex: 'container_([a-z_]+);',
action: 'drop',
},
// Drop several metrics that are still exposed even though they are disabled, see
// https://github.com/google/cadvisor/issues/1925.
{
sourceLabels: ['__name__'],
regex: 'container_(network_tcp_usage_total|network_udp_usage_total|tasks_state|cpu_load_average_10s)',
action: 'drop',
},
],
}, },
], ],
selector: { selector: {
@@ -374,6 +390,16 @@ local k = import 'ksonnet/ksonnet.beta.3/k.libsonnet';
regex: 'etcd_(debugging|disk|request|server).*', regex: 'etcd_(debugging|disk|request|server).*',
action: 'drop', action: 'drop',
}, },
{
sourceLabels: ['__name__'],
regex: 'apiserver_admission_controller_admission_latencies_seconds_.*',
action: 'drop',
},
{
sourceLabels: ['__name__'],
regex: 'apiserver_admission_step_admission_latencies_seconds_.*',
action: 'drop',
},
], ],
}, },
], ],

View File

@@ -8,7 +8,7 @@
"subdir": "contrib/kube-prometheus/jsonnet/kube-prometheus" "subdir": "contrib/kube-prometheus/jsonnet/kube-prometheus"
} }
}, },
"version": "6963b7410f28575a90a65c0aee1c79c8ef392fbb" "version": "986d387aaa6c292c248fc9d31c8b564462bd619e"
}, },
{ {
"name": "ksonnet", "name": "ksonnet",
@@ -28,7 +28,7 @@
"subdir": "" "subdir": ""
} }
}, },
"version": "668950e4af13f0153fa1d7b58ebe7023b33f2217" "version": "ae5d0b27229765fc0670c48c09a95cb6da732de3"
}, },
{ {
"name": "grafonnet", "name": "grafonnet",

View File

@@ -241,25 +241,25 @@ spec:
max by (namespace, pod, device) (node_filesystem_avail_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"} / node_filesystem_size_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"}) max by (namespace, pod, device) (node_filesystem_avail_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"} / node_filesystem_size_bytes{fstype=~"ext[234]|btrfs|xfs|zfs"})
record: 'node:node_filesystem_avail:' record: 'node:node_filesystem_avail:'
- expr: | - expr: |
sum(irate(node_network_receive_bytes_total{job="node-exporter",device="eth0"}[1m])) + sum(irate(node_network_receive_bytes_total{job="node-exporter",device!~"veth.+"}[1m])) +
sum(irate(node_network_transmit_bytes_total{job="node-exporter",device="eth0"}[1m])) sum(irate(node_network_transmit_bytes_total{job="node-exporter",device!~"veth.+"}[1m]))
record: :node_net_utilisation:sum_irate record: :node_net_utilisation:sum_irate
- expr: | - expr: |
sum by (node) ( sum by (node) (
(irate(node_network_receive_bytes_total{job="node-exporter",device="eth0"}[1m]) + (irate(node_network_receive_bytes_total{job="node-exporter",device!~"veth.+"}[1m]) +
irate(node_network_transmit_bytes_total{job="node-exporter",device="eth0"}[1m])) irate(node_network_transmit_bytes_total{job="node-exporter",device!~"veth.+"}[1m]))
* on (namespace, pod) group_left(node) * on (namespace, pod) group_left(node)
node_namespace_pod:kube_pod_info: node_namespace_pod:kube_pod_info:
) )
record: node:node_net_utilisation:sum_irate record: node:node_net_utilisation:sum_irate
- expr: | - expr: |
sum(irate(node_network_receive_drop_total{job="node-exporter",device="eth0"}[1m])) + sum(irate(node_network_receive_drop_total{job="node-exporter",device!~"veth.+"}[1m])) +
sum(irate(node_network_transmit_drop_total{job="node-exporter",device="eth0"}[1m])) sum(irate(node_network_transmit_drop_total{job="node-exporter",device!~"veth.+"}[1m]))
record: :node_net_saturation:sum_irate record: :node_net_saturation:sum_irate
- expr: | - expr: |
sum by (node) ( sum by (node) (
(irate(node_network_receive_drop_total{job="node-exporter",device="eth0"}[1m]) + (irate(node_network_receive_drop_total{job="node-exporter",device!~"veth.+"}[1m]) +
irate(node_network_transmit_drop_total{job="node-exporter",device="eth0"}[1m])) irate(node_network_transmit_drop_total{job="node-exporter",device!~"veth.+"}[1m]))
* on (namespace, pod) group_left(node) * on (namespace, pod) group_left(node)
node_namespace_pod:kube_pod_info: node_namespace_pod:kube_pod_info:
) )

View File

@@ -14,6 +14,14 @@ spec:
regex: etcd_(debugging|disk|request|server).* regex: etcd_(debugging|disk|request|server).*
sourceLabels: sourceLabels:
- __name__ - __name__
- action: drop
regex: apiserver_admission_controller_admission_latencies_seconds_.*
sourceLabels:
- __name__
- action: drop
regex: apiserver_admission_step_admission_latencies_seconds_.*
sourceLabels:
- __name__
port: https port: https
scheme: https scheme: https
tlsConfig: tlsConfig:

View File

@@ -17,6 +17,16 @@ spec:
- bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token - bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
honorLabels: true honorLabels: true
interval: 30s interval: 30s
metricRelabelings:
- action: drop
regex: container_([a-z_]+);
sourceLabels:
- __name__
- image
- action: drop
regex: container_(network_tcp_usage_total|network_udp_usage_total|tasks_state|cpu_load_average_10s)
sourceLabels:
- __name__
path: /metrics/cadvisor path: /metrics/cadvisor
port: https-metrics port: https-metrics
scheme: https scheme: https