modules/nixos/monitoring: add ofborg prometheus and eval queue alert

This commit is contained in:
zowoq 2024-01-28 15:14:02 +10:00
parent 4b8e915bc3
commit 9e026e0366
2 changed files with 9 additions and 0 deletions
modules/nixos/monitoring

View file

@ -26,6 +26,12 @@
annotations.description = "{{$labels.host}} should have a running {{$labels.name}}";
};
# Alert rule for the ofborg evaluator queue: matches when the
# `ofborg_queue_evaluator_waiting` metric is greater than twice
# `ofborg_queue_evaluator_consumers`.
OfBorgEvalQueue = {
expr = ''ofborg_queue_evaluator_waiting > (2 * ofborg_queue_evaluator_consumers)'';
# NOTE(review): presumably the expression has to stay true for a full hour
# before the alert fires, so short bursts are ignored — confirm against
# how this attribute set is turned into alerting rules.
for = "1h";
annotations.description = "ofborg evaluator queue is more than 2x the number of evaluators";
};
SmartErrors.expr = lib.mkForce ''smart_device_health_ok{enabled!="Disabled", host!="build01"} != 1'';
};
};

View file

@ -41,5 +41,8 @@
timeout = "10s";
})
hosts;
# Prometheus-format metrics URL for ofborg.
# NOTE(review): presumably scraped by the enclosing collector configuration
# (not visible in this hunk) — confirm which input this attribute belongs to.
prometheus.urls = [
"https://events.ofborg.org/prometheus.php"
];
};
}