I hate Redis!
- Remove redis check from our health endpoint in prod entirely - Have the redis check have a maximum timeout of 1 second
This commit is contained in:
parent
ad53bf5671
commit
c518874ded
3 changed files with 22 additions and 10 deletions
|
@ -18,7 +18,11 @@ class RedisBuildLogs(object):
|
|||
PHASE = 'phase'
|
||||
|
||||
def __init__(self, redis_config):
|
||||
self._redis = redis.StrictRedis(socket_connect_timeout=5, **redis_config)
|
||||
args = dict(redis_config)
|
||||
args.update({'socket_connect_timeout': 5})
|
||||
|
||||
self._redis_config = redis_config
|
||||
self._redis = redis.StrictRedis(**args)
|
||||
|
||||
@staticmethod
|
||||
def _logs_key(build_id):
|
||||
|
@ -94,12 +98,16 @@ class RedisBuildLogs(object):
|
|||
|
||||
def check_health(self):
|
||||
try:
|
||||
if not self._redis.ping() == True:
|
||||
args = dict(self._redis_config)
|
||||
args.update({'socket_connect_timeout': 1, 'socket_timeout': 1})
|
||||
|
||||
connection = redis.StrictRedis(**args)
|
||||
if not connection.ping() == True:
|
||||
return False
|
||||
|
||||
# Ensure we can write and read a key.
|
||||
self._redis.set(self._health_key(), time.time())
|
||||
self._redis.get(self._health_key())
|
||||
connection.set(self._health_key(), time.time())
|
||||
connection.get(self._health_key())
|
||||
|
||||
return True
|
||||
except redis.ConnectionError:
|
||||
|
|
|
@ -10,16 +10,17 @@ def get_healthchecker(app, config_provider):
|
|||
|
||||
|
||||
class HealthCheck(object):
|
||||
def __init__(self, app, config_provider):
|
||||
def __init__(self, app, config_provider, instance_skips=None):
|
||||
self.app = app
|
||||
self.config_provider = config_provider
|
||||
self.instance_skips = instance_skips or []
|
||||
|
||||
def check_instance(self):
|
||||
"""
|
||||
Conducts a check on this specific instance, returning a dict representing the HealthCheck
|
||||
output and a number indicating the health check response code.
|
||||
"""
|
||||
service_statuses = check_all_services(self.app)
|
||||
service_statuses = check_all_services(self.app, skip=self.instance_skips)
|
||||
return self.get_instance_health(service_statuses)
|
||||
|
||||
def check_endtoend(self):
|
||||
|
@ -80,7 +81,7 @@ class LocalHealthCheck(HealthCheck):
|
|||
|
||||
class ProductionHealthCheck(HealthCheck):
|
||||
def __init__(self, app, config_provider, access_key, secret_key, db_instance='quay'):
|
||||
super(ProductionHealthCheck, self).__init__(app, config_provider)
|
||||
super(ProductionHealthCheck, self).__init__(app, config_provider, ['redis'])
|
||||
self.access_key = access_key
|
||||
self.secret_key = secret_key
|
||||
self.db_instance = db_instance
|
||||
|
@ -92,7 +93,7 @@ class ProductionHealthCheck(HealthCheck):
|
|||
def get_instance_health(self, service_statuses):
|
||||
# Note: We skip the redis check because if redis is down, we don't want ELB taking the
|
||||
# machines out of service. Redis is not considered a high avaliability-required service.
|
||||
skip = ['redis']
|
||||
skip = []
|
||||
notes = []
|
||||
|
||||
# If the database is marked as unhealthy, check the status of RDS directly. If RDS is
|
||||
|
|
|
@ -39,10 +39,13 @@ _SERVICES = {
|
|||
'redis': _check_redis
|
||||
}
|
||||
|
||||
def check_all_services(app):
|
||||
def check_all_services(app, skip):
|
||||
""" Returns a dictionary containing the status of all the services defined. """
|
||||
status = {}
|
||||
for name in _SERVICES:
|
||||
if name in skip:
|
||||
continue
|
||||
|
||||
status[name] = _SERVICES[name](app)
|
||||
|
||||
return status
|
Reference in a new issue