Defined Type: profile::cache::kafka::varnishkafka_delivery_alert
- Defined in:
- modules/profile/manifests/cache/kafka/varnishkafka_delivery_alert.pp
Overview
Define: profile::cache::kafka::varnishkafka_delivery_alert
Define to ease the creation of all per-DC Varnishkafka Prometheus checks for delivery errors.
6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 |
# File 'modules/profile/manifests/cache/kafka/varnishkafka_delivery_alert.pp', line 6
# Declares one Prometheus check per datacenter site for the delivery error
# rate of a single Varnishkafka instance.
#
# For every site in the list below, a monitoring::check_prometheus resource is
# declared that queries that site's Prometheus 'ops' endpoint for the summed
# irate (over a 5m range) of varnishkafka_delivery_errors_total, filtered by
# cluster and source.
#
# @param cache_segment
#   Cache segment name; interpolated as "cache_${cache_segment}" into the
#   check description, the Prometheus `cluster` label matcher and the
#   Grafana `var-cp_cluster` dashboard variable.
# @param instance
#   Varnishkafka instance name; used as the Prometheus `source` label matcher
#   and the Grafana `var-source` dashboard variable.
define profile::cache::kafka::varnishkafka_delivery_alert(
    String $cache_segment,
    String $instance,
) {
    # Sites that get a check. The order matches the original hand-written
    # declarations; one resource per entry is declared below.
    $sites = ['eqiad', 'codfw', 'esams', 'ulsfo', 'eqsin']

    $sites.each |String $site| {
        monitoring::check_prometheus { "varnishkafka-${instance}-${cache_segment}-${site}-kafka_drerr":
            description     => "cache_${cache_segment}: Varnishkafka ${instance} Delivery Errors per second (${site})",
            # The Grafana datasource variable is "<site> prometheus/ops" (with a
            # space), exactly as in the hand-written per-site links. Generating
            # it from $site keeps all sites consistent and drops the stray
            # duplicated "&prometheus/ops" fragment the codfw link used to have.
            dashboard_links => ["https://grafana.wikimedia.org/d/000000253/varnishkafka?panelId=20&fullscreen&orgId=1&var-datasource=${site} prometheus/ops&var-source=${instance}&var-cp_cluster=cache_${cache_segment}&var-instance=All"],
            query           => "scalar(sum(irate(varnishkafka_delivery_errors_total{cluster=\"cache_${cache_segment}\", source=\"${instance}\"}[5m])))",
            prometheus_url  => "http://prometheus.svc.${site}.wmnet/ops",
            warning         => 1,
            critical        => 5,
            contact_group   => 'analytics',
            notes_link      => 'https://wikitech.wikimedia.org/wiki/Analytics/Systems/Varnishkafka',
        }
    }
}
|