Filippo Giunchedi has submitted this change and it was merged.

Change subject: prometheus: add aggregation rules for ops
......................................................................
prometheus: add aggregation rules for ops Change-Id: I1fd1ea3e590651f0259fda82340ad62e7d365545 --- A modules/role/files/prometheus/rules_ops.conf M modules/role/manifests/prometheus/ops.pp 2 files changed, 22 insertions(+), 0 deletions(-) Approvals: Filippo Giunchedi: Looks good to me, approved jenkins-bot: Verified diff --git a/modules/role/files/prometheus/rules_ops.conf b/modules/role/files/prometheus/rules_ops.conf new file mode 100644 index 0000000..2f81ef3 --- /dev/null +++ b/modules/role/files/prometheus/rules_ops.conf @@ -0,0 +1,17 @@ +# https://prometheus.io/docs/practices/rules/ + +instance:node_cpu:count = count(node_cpu{mode="idle",job="node"}) by (instance, cluster) + +cluster_device:network_transmit_bytes:rate5m = sum(rate(node_network_transmit_bytes{job="node"}[5m])) by (cluster,device) +cluster_device:network_receive_bytes:rate5m = sum(rate(node_network_receive_bytes{job="node"}[5m])) by (cluster,device) + +cluster_mode:cpu:rate5m = sum(rate(node_cpu{job="node"}[5m])) by (cluster, mode) + +cluster:memory_MemTotal:sum = sum(node_memory_MemTotal{job="node"}) by (cluster) +cluster:memory_MemCached:sum = sum(node_memory_MemCached{job="node"}) by (cluster) +cluster:memory_MemActive:sum = sum(node_memory_MemActive{job="node"}) by (cluster) + +cluster:load1:sum = sum(node_load1{job="node"}) by (cluster) +cluster:cpu:sum = sum(instance:node_cpu:count) by (cluster) +cluster:up:sum = sum(up{job="node"}) by (cluster) +cluster:up:count = count(up{job="node"}) by (cluster) diff --git a/modules/role/manifests/prometheus/ops.pp b/modules/role/manifests/prometheus/ops.pp index 8ebf848..0d39db9 100644 --- a/modules/role/manifests/prometheus/ops.pp +++ b/modules/role/manifests/prometheus/ops.pp @@ -4,6 +4,7 @@ include base::firewall $targets_path = '/srv/prometheus/ops/targets' + $rules_path = '/srv/prometheus/ops/rules' # Add one job for each of mysql 'group' (i.e. 
their broad function) # Each job will look for new files matching the glob and load the job @@ -93,4 +94,8 @@ file { "${targets_path}/mysql-labs_${::site}.yaml": source => "puppet:///modules/role/prometheus/mysql-labs_${::site}.yaml", } + + file { "${rules_path}/rules_ops.conf": + source => 'puppet:///modules/role/prometheus/rules_ops.conf', + } } -- To view, visit https://gerrit.wikimedia.org/r/307310 To unsubscribe, visit https://gerrit.wikimedia.org/r/settings Gerrit-MessageType: merged Gerrit-Change-Id: I1fd1ea3e590651f0259fda82340ad62e7d365545 Gerrit-PatchSet: 2 Gerrit-Project: operations/puppet Gerrit-Branch: production Gerrit-Owner: Filippo Giunchedi <fgiunch...@wikimedia.org> Gerrit-Reviewer: Filippo Giunchedi <fgiunch...@wikimedia.org> Gerrit-Reviewer: jenkins-bot <> _______________________________________________ MediaWiki-commits mailing list MediaWiki-commits@lists.wikimedia.org https://lists.wikimedia.org/mailman/listinfo/mediawiki-commits