monit: Set a high timeout waiting for status changes
Instead of waiting for up to a certain number of retries, we set a high timeout and only re-check every five seconds. Certain services can take a minute or more to start, and we want to avoid wasting resources by polling too often.
This commit is contained in:
parent
262f2e9048
commit
72155d40a3
1 changed files with 16 additions and 16 deletions
|
@ -18,7 +18,7 @@
|
||||||
# You should have received a copy of the GNU General Public License
|
# You should have received a copy of the GNU General Public License
|
||||||
# along with Ansible. If not, see <http://www.gnu.org/licenses/>.
|
# along with Ansible. If not, see <http://www.gnu.org/licenses/>.
|
||||||
#
|
#
|
||||||
from time import sleep
|
import time
|
||||||
|
|
||||||
DOCUMENTATION = '''
|
DOCUMENTATION = '''
|
||||||
---
|
---
|
||||||
|
@ -39,12 +39,13 @@ options:
|
||||||
required: true
|
required: true
|
||||||
default: null
|
default: null
|
||||||
choices: [ "present", "started", "stopped", "restarted", "monitored", "unmonitored", "reloaded" ]
|
choices: [ "present", "started", "stopped", "restarted", "monitored", "unmonitored", "reloaded" ]
|
||||||
max_retries:
|
timeout:
|
||||||
description:
|
description:
|
||||||
- If there are pending actions for the service monitoried by monit Ansible will retry this
|
- If there are pending actions for the service monitored by monit, then Ansible will check
|
||||||
many times to perform the requested action. Between each retry Ansible will sleep for 1 second.
|
for up to this many seconds to verify that the requested action has been performed.
|
||||||
|
Ansible will sleep for five seconds between each check.
|
||||||
required: false
|
required: false
|
||||||
default: 10
|
default: 300
|
||||||
version_added: "2.0"
|
version_added: "2.0"
|
||||||
requirements: [ ]
|
requirements: [ ]
|
||||||
author: "Darryl Stoflet (@dstoflet)"
|
author: "Darryl Stoflet (@dstoflet)"
|
||||||
|
@ -58,7 +59,7 @@ EXAMPLES = '''
|
||||||
def main():
|
def main():
|
||||||
arg_spec = dict(
|
arg_spec = dict(
|
||||||
name=dict(required=True),
|
name=dict(required=True),
|
||||||
max_retries=dict(default=10, type='int'),
|
timeout=dict(default=300, type='int'),
|
||||||
state=dict(required=True, choices=['present', 'started', 'restarted', 'stopped', 'monitored', 'unmonitored', 'reloaded'])
|
state=dict(required=True, choices=['present', 'started', 'restarted', 'stopped', 'monitored', 'unmonitored', 'reloaded'])
|
||||||
)
|
)
|
||||||
|
|
||||||
|
@ -66,7 +67,7 @@ def main():
|
||||||
|
|
||||||
name = module.params['name']
|
name = module.params['name']
|
||||||
state = module.params['state']
|
state = module.params['state']
|
||||||
max_retries = module.params['max_retries']
|
timeout = module.params['timeout']
|
||||||
|
|
||||||
MONIT = module.get_bin_path('monit', True)
|
MONIT = module.get_bin_path('monit', True)
|
||||||
|
|
||||||
|
@ -88,23 +89,22 @@ def main():
|
||||||
module.run_command('%s %s %s' % (MONIT, command, name), check_rc=True)
|
module.run_command('%s %s %s' % (MONIT, command, name), check_rc=True)
|
||||||
return status()
|
return status()
|
||||||
|
|
||||||
def wait_for_monit_to_stop_pending(sleep_time=1):
|
def wait_for_monit_to_stop_pending():
|
||||||
"""Fails this run if there is no status or it's pending/initalizing for max_retries"""
|
"""Fails this run if there is no status or it's pending/initalizing for timeout"""
|
||||||
running_status = status()
|
timeout_time = time.time() + timeout
|
||||||
retries = 0
|
sleep_time = 5
|
||||||
|
|
||||||
|
running_status = status()
|
||||||
while running_status == '' or 'pending' in running_status or 'initializing' in running_status:
|
while running_status == '' or 'pending' in running_status or 'initializing' in running_status:
|
||||||
if retries >= max_retries:
|
if time.time() >= timeout_time:
|
||||||
module.fail_json(
|
module.fail_json(
|
||||||
msg='too many retries waiting for empty, "pending", or "initiating" status to go away ({0})'.format(
|
msg='waited too long for "pending", or "initiating" status to go away ({0})'.format(
|
||||||
running_status
|
running_status
|
||||||
),
|
),
|
||||||
retries=retries,
|
|
||||||
state=state
|
state=state
|
||||||
)
|
)
|
||||||
|
|
||||||
sleep(sleep_time)
|
time.sleep(sleep_time)
|
||||||
retries += 1
|
|
||||||
running_status = status()
|
running_status = status()
|
||||||
|
|
||||||
if state == 'reloaded':
|
if state == 'reloaded':
|
||||||
|
|
Loading…
Add table
Reference in a new issue