modules/nixos/monitoring: add ofborg prometheus and eval queue alert
This commit is contained in:
parent
4b8e915bc3
commit
9e026e0366
2 changed files with 9 additions and 0 deletions
modules/nixos/monitoring
|
@@ -26,6 +26,12 @@
|
|||
annotations.description = "{{$labels.host}} should have a running {{$labels.name}}";
|
||||
};
|
||||
|
||||
OfBorgEvalQueue = {
|
||||
expr = ''ofborg_queue_evaluator_waiting > (2 * ofborg_queue_evaluator_consumers)'';
|
||||
for = "1h";
|
||||
annotations.description = "ofborg evaluator queue is more than 2x the number of evaluators";
|
||||
};
|
||||
|
||||
SmartErrors.expr = lib.mkForce ''smart_device_health_ok{enabled!="Disabled", host!="build01"} != 1'';
|
||||
};
|
||||
};
|
||||
|
|
|
@@ -41,5 +41,8 @@
|
|||
timeout = "10s";
|
||||
})
|
||||
hosts;
|
||||
prometheus.urls = [
|
||||
"https://events.ofborg.org/prometheus.php"
|
||||
];
|
||||
};
|
||||
}
|
||||
|
|
Loading…
Add table
Reference in a new issue