AAP-78420: Updating the remediation condition in system.py to check for cpu and memory values set to 0. (#16499)

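Updates the remediation condition on line 636 so that an enabled instance also enters the remediation health-check branch when both its cpu and memory values are 0, not only when its capacity is 0.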
This commit is contained in:
thanujdesu11
2026-06-18 13:05:04 -04:00
committed by GitHub
parent c1bd2eb338
commit f8fc3d107f

View File

@@ -633,7 +633,7 @@ def inspect_execution_and_hop_nodes(instance_list):
# check
logger.warning(f'Execution node attempting to rejoin as instance {hostname}.')
execution_node_health_check.apply_async([hostname])
elif instance.capacity == 0 and instance.enabled:
elif (instance.capacity == 0 or (instance.cpu == 0 and instance.memory == 0)) and instance.enabled:
# nodes with proven connection but need remediation run health checks are reduced frequency
if not instance.last_health_check or (nowtime - instance.last_health_check).total_seconds() >= settings.EXECUTION_NODE_REMEDIATION_CHECKS:
# Periodically re-run the health check of errored nodes, in case someone fixed it