Run IPMI check 3 times with 2s timeout
Avoids potential timeouts or deadlocks, and retries if a single try fails.
This commit is contained in:
parent
97329bb90d
commit
9aca8e215b
|
@ -69,26 +69,33 @@ class MonitoringPluginScript(MonitoringPlugin):
|
||||||
|
|
||||||
# Run any imports first
|
# Run any imports first
|
||||||
from daemon_lib.common import run_os_command
|
from daemon_lib.common import run_os_command
|
||||||
|
from time import sleep
|
||||||
|
|
||||||
# Check the node's IPMI interface
|
# Check the node's IPMI interface
|
||||||
ipmi_hostname = self.config["ipmi_hostname"]
|
ipmi_hostname = self.config["ipmi_hostname"]
|
||||||
ipmi_username = self.config["ipmi_username"]
|
ipmi_username = self.config["ipmi_username"]
|
||||||
ipmi_password = self.config["ipmi_password"]
|
ipmi_password = self.config["ipmi_password"]
|
||||||
retcode, _, _ = run_os_command(
|
retcode = 1
|
||||||
f"/usr/bin/ipmitool -I lanplus -H {ipmi_hostname} -U {ipmi_username} -P {ipmi_password} chassis power status",
|
trycount = 0
|
||||||
timeout=5
|
while retcode > 0 and trycount < 3:
|
||||||
)
|
retcode, _, _ = run_os_command(
|
||||||
|
f"/usr/bin/ipmitool -I lanplus -H {ipmi_hostname} -U {ipmi_username} -P {ipmi_password} chassis power status",
|
||||||
|
timeout=2
|
||||||
|
)
|
||||||
|
trycount += 1
|
||||||
|
if retcode > 0 and trycount < 3:
|
||||||
|
sleep(trycount)
|
||||||
|
|
||||||
if retcode > 0:
|
if retcode > 0:
|
||||||
# Set the health delta to 10 (subtract 10 from the total of 100)
|
# Set the health delta to 10 (subtract 10 from the total of 100)
|
||||||
health_delta = 10
|
health_delta = 10
|
||||||
# Craft a message that can be used by the clients
|
# Craft a message that can be used by the clients
|
||||||
message = f"IPMI via {ipmi_username}@{ipmi_hostname} is NOT responding"
|
message = f"IPMI via {ipmi_username}@{ipmi_hostname} is NOT responding after 3 attempts"
|
||||||
else:
|
else:
|
||||||
# Set the health delta to 0 (no change)
|
# Set the health delta to 0 (no change)
|
||||||
health_delta = 0
|
health_delta = 0
|
||||||
# Craft a message that can be used by the clients
|
# Craft a message that can be used by the clients
|
||||||
message = f"IPMI via {ipmi_username}@{ipmi_hostname} is responding"
|
message = f"IPMI via {ipmi_username}@{ipmi_hostname} is responding after {trycount} attempts"
|
||||||
|
|
||||||
# Set the health delta in our local PluginResult object
|
# Set the health delta in our local PluginResult object
|
||||||
self.plugin_result.set_health_delta(health_delta)
|
self.plugin_result.set_health_delta(health_delta)
|
||||||
|
|
Loading…
Reference in New Issue