Monitors for containers stuck in restart loops or unhealthy states:
- Critical: restart loop (≥3 restarts)
- Warning: restarting, exited abnormally, or unhealthy

Disabled by default in config.json.

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
68 lines
1.2 KiB
JSON
68 lines
1.2 KiB
JSON
{
  "port": 5100,
  "aggregator": {
    "script": "aggregator.py"
  },
  "detectors": [
    {
      "name": "disk_space",
      "enabled": true,
      "script": "detectors/disk_space.py",
      "env": {
        "CHECK_INTERVAL": "300",
        "THRESHOLD_WARNING": "85",
        "THRESHOLD_CRITICAL": "95"
      }
    },
    {
      "name": "cpu",
      "enabled": true,
      "script": "detectors/cpu.py",
      "env": {
        "CHECK_INTERVAL": "30",
        "THRESHOLD_WARNING": "85",
        "THRESHOLD_CRITICAL": "95"
      }
    },
    {
      "name": "memory",
      "enabled": true,
      "script": "detectors/memory.py",
      "env": {
        "CHECK_INTERVAL": "30",
        "THRESHOLD_WARNING": "85",
        "THRESHOLD_CRITICAL": "95"
      }
    },
    {
      "name": "service",
      "enabled": false,
      "script": "detectors/service.py",
      "env": {
        "CHECK_INTERVAL": "30",
        "SERVICES": "nginx,postgres"
      }
    },
    {
      "name": "network",
      "enabled": false,
      "script": "detectors/network.py",
      "env": {
        "CHECK_INTERVAL": "60",
        "HOSTS": "8.8.8.8,google.com",
        "TIMEOUT": "5"
      }
    },
    {
      "name": "docker",
      "enabled": false,
      "script": "detectors/docker.py",
      "env": {
        "CHECK_INTERVAL": "60",
        "RESTART_THRESHOLD": "3",
        "CONTAINERS": ""
      }
    }
  ]
}