mirror of https://github.com/ansible/ansible.git
CloudRetry/AWSRetry backoff decorator with unit tests (#17039)
* Added aws_retry decorator function with unit tests * Restructured the code to be used with a base class. This base class CloudRetry can be reused by any other cloud provider. This decorator should be used in situations, where you need to implement a backoff algorithm and want to retry based on the status code from the exception. * updated documentation * fixed tabs * added botocore and boto3 to requirements.txt * removed cloud.py from py24 tests, as it depends on boto3 * fix relative imports * updated test to be 2.6 compat * updated method name from retry to backoff * readded lxd * Updated default backoff from 2 seconds to 1.1s. This will be about a total of 48 seconds in 10 tries. This is configurable.pull/17554/head
parent
60706cc12e
commit
b510abce17
@ -0,0 +1,108 @@
|
|||||||
|
#
|
||||||
|
# (c) 2016 Allen Sanabria, <asanabria@linuxdynasty.org>
|
||||||
|
#
|
||||||
|
# This file is part of Ansible
|
||||||
|
#
|
||||||
|
# Ansible is free software: you can redistribute it and/or modify
|
||||||
|
# it under the terms of the GNU General Public License as published by
|
||||||
|
# the Free Software Foundation, either version 3 of the License, or
|
||||||
|
# (at your option) any later version.
|
||||||
|
#
|
||||||
|
# Ansible is distributed in the hope that it will be useful,
|
||||||
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
# GNU General Public License for more details.
|
||||||
|
#
|
||||||
|
# You should have received a copy of the GNU General Public License
|
||||||
|
# along with Ansible. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
#
|
||||||
|
"""
|
||||||
|
This module adds shared support for generic cloud modules
|
||||||
|
|
||||||
|
In order to use this module, include it as part of a custom
|
||||||
|
module as shown below.
|
||||||
|
|
||||||
|
from ansible.module_utils.cloud import *
|
||||||
|
|
||||||
|
The 'cloud' module provides the following common classes:
|
||||||
|
|
||||||
|
* CloudRetry
|
||||||
|
- The base class to be used by other cloud providers, in order to
|
||||||
|
provide a backoff/retry decorator based on status codes.
|
||||||
|
|
||||||
|
- Example using the AWSRetry class which inherits from CloudRetry.
|
||||||
|
@AWSRetry.retry(tries=20, delay=2, backoff=2)
|
||||||
|
get_ec2_security_group_ids_from_names()
|
||||||
|
|
||||||
|
"""
|
||||||
|
from functools import wraps
|
||||||
|
import syslog
|
||||||
|
import time
|
||||||
|
|
||||||
|
from ansible.module_utils.pycompat24 import get_exception
|
||||||
|
|
||||||
|
|
||||||
|
class CloudRetry(object):
|
||||||
|
""" CloudRetry can be used by any cloud provider, in order to implement a
|
||||||
|
backoff algorithm/retry effect based on Status Code from Exceptions.
|
||||||
|
"""
|
||||||
|
# This is the base class of the exception.
|
||||||
|
# AWS Example botocore.exceptions.ClientError
|
||||||
|
base_class = None
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
def status_code_from_exception(error):
|
||||||
|
""" Return the status code from the exception object
|
||||||
|
Args:
|
||||||
|
error (object): The exception itself.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
@staticmethod
|
||||||
|
def found(response_code):
|
||||||
|
""" Return True if the Response Code to retry on was found.
|
||||||
|
Args:
|
||||||
|
response_code (str): This is the Response Code that is being matched against.
|
||||||
|
"""
|
||||||
|
pass
|
||||||
|
|
||||||
|
@classmethod
|
||||||
|
def backoff(cls, tries=10, delay=3, backoff=1.1):
|
||||||
|
""" Retry calling the Cloud decorated function using an exponential backoff.
|
||||||
|
Kwargs:
|
||||||
|
tries (int): Number of times to try (not retry) before giving up
|
||||||
|
default=10
|
||||||
|
delay (int): Initial delay between retries in seconds
|
||||||
|
default=3
|
||||||
|
backoff (int): backoff multiplier e.g. value of 2 will double the delay each retry
|
||||||
|
default=2
|
||||||
|
|
||||||
|
"""
|
||||||
|
def deco(f):
|
||||||
|
@wraps(f)
|
||||||
|
def retry_func(*args, **kwargs):
|
||||||
|
max_tries, max_delay = tries, delay
|
||||||
|
while max_tries > 1:
|
||||||
|
try:
|
||||||
|
return f(*args, **kwargs)
|
||||||
|
except Exception:
|
||||||
|
e = get_exception()
|
||||||
|
if isinstance(e, cls.base_class):
|
||||||
|
response_code = cls.status_code_from_exception(e)
|
||||||
|
if cls.found(response_code):
|
||||||
|
msg = "{0}: Retrying in {1} seconds...".format(str(e), max_delay)
|
||||||
|
syslog.syslog(syslog.LOG_INFO, msg)
|
||||||
|
time.sleep(max_delay)
|
||||||
|
max_tries -= 1
|
||||||
|
max_delay *= backoff
|
||||||
|
else:
|
||||||
|
# Return original exception if exception is not a ClientError
|
||||||
|
raise e
|
||||||
|
else:
|
||||||
|
# Return original exception if exception is not a ClientError
|
||||||
|
raise e
|
||||||
|
return f(*args, **kwargs)
|
||||||
|
|
||||||
|
return retry_func # true decorator
|
||||||
|
|
||||||
|
return deco
|
||||||
@ -0,0 +1,87 @@
|
|||||||
|
# -*- coding: utf-8 -*-
|
||||||
|
# (c) 2015, Allen Sanabria <asanabria@linuxdynasty.org>
|
||||||
|
#
|
||||||
|
# This file is part of Ansible
|
||||||
|
#
|
||||||
|
# Ansible is free software: you can redistribute it and/or modify
|
||||||
|
# it under the terms of the GNU General Public License as published by
|
||||||
|
# the Free Software Foundation, either version 3 of the License, or
|
||||||
|
# (at your option) any later version.
|
||||||
|
#
|
||||||
|
# Ansible is distributed in the hope that it will be useful,
|
||||||
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
# GNU General Public License for more details.
|
||||||
|
#
|
||||||
|
# You should have received a copy of the GNU General Public License
|
||||||
|
# along with Ansible. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
|
||||||
|
import unittest
|
||||||
|
import botocore
|
||||||
|
import boto3
|
||||||
|
|
||||||
|
from ansible.module_utils.ec2 import AWSRetry
|
||||||
|
|
||||||
|
class RetryTestCase(unittest.TestCase):
|
||||||
|
|
||||||
|
def test_no_failures(self):
|
||||||
|
self.counter = 0
|
||||||
|
|
||||||
|
@AWSRetry.backoff(tries=2, delay=0.1)
|
||||||
|
def no_failures():
|
||||||
|
self.counter += 1
|
||||||
|
|
||||||
|
r = no_failures()
|
||||||
|
self.assertEqual(self.counter, 1)
|
||||||
|
|
||||||
|
def test_retry_once(self):
|
||||||
|
self.counter = 0
|
||||||
|
err_msg = {'Error': {'Code': 'InstanceId.NotFound'}}
|
||||||
|
|
||||||
|
@AWSRetry.backoff(tries=2, delay=0.1)
|
||||||
|
def retry_once():
|
||||||
|
self.counter += 1
|
||||||
|
if self.counter < 2:
|
||||||
|
raise botocore.exceptions.ClientError(err_msg, 'Could not find you')
|
||||||
|
else:
|
||||||
|
return 'success'
|
||||||
|
|
||||||
|
r = retry_once()
|
||||||
|
self.assertEqual(r, 'success')
|
||||||
|
self.assertEqual(self.counter, 2)
|
||||||
|
|
||||||
|
def test_reached_limit(self):
|
||||||
|
self.counter = 0
|
||||||
|
err_msg = {'Error': {'Code': 'RequestLimitExceeded'}}
|
||||||
|
|
||||||
|
@AWSRetry.backoff(tries=4, delay=0.1)
|
||||||
|
def fail():
|
||||||
|
self.counter += 1
|
||||||
|
raise botocore.exceptions.ClientError(err_msg, 'toooo fast!!')
|
||||||
|
|
||||||
|
#with self.assertRaises(botocore.exceptions.ClientError):
|
||||||
|
try:
|
||||||
|
fail()
|
||||||
|
except Exception as e:
|
||||||
|
self.assertEqual(e.response['Error']['Code'], 'RequestLimitExceeded')
|
||||||
|
self.assertEqual(self.counter, 4)
|
||||||
|
|
||||||
|
def test_unexpected_exception_does_not_retry(self):
|
||||||
|
self.counter = 0
|
||||||
|
err_msg = {'Error': {'Code': 'AuthFailure'}}
|
||||||
|
|
||||||
|
@AWSRetry.backoff(tries=4, delay=0.1)
|
||||||
|
def raise_unexpected_error():
|
||||||
|
self.counter += 1
|
||||||
|
raise botocore.exceptions.ClientError(err_msg, 'unexpected error')
|
||||||
|
|
||||||
|
#with self.assertRaises(botocore.exceptions.ClientError):
|
||||||
|
try:
|
||||||
|
raise_unexpected_error()
|
||||||
|
except Exception as e:
|
||||||
|
self.assertEqual(e.response['Error']['Code'], 'AuthFailure')
|
||||||
|
|
||||||
|
self.assertEqual(self.counter, 1)
|
||||||
|
|
||||||
|
if __name__ == '__main__':
|
||||||
|
unittest.main()
|
||||||
Loading…
Reference in New Issue