Files
oslo.service/oslo_service/backend/threading/loopingcall.py
Daniel Bengtsson 5de514f1f8 Add threading backend implementation using cotyledon and standard threads
Introduces a new threading backend for oslo.service that provides a
complete alternative to the eventlet-based backend.

This backend includes:
	• A ThreadGroup and Thread implementation using the Python
	  threading module.
	• A reimplementation of all looping call utilities (
	  FixedIntervalLoopingCall, DynamicLoopingCall, etc.) using
	  threading.Event and futurist.ThreadPoolExecutor.
	• A service management layer based on cotyledon, including
	  Service,ServiceWrapper, Launcher, and ProcessLauncher.
	• A new ThreadingBackend class that exposes all components
	  needed for integration into oslo.service.

This change provides a robust and eventlet-free alternative backend while maintaining API compatibility.

Change-Id: Ia7518401ccdcc28afbffd4ffe5c3b772f3617001
2025-05-14 14:03:04 +02:00

404 lines
14 KiB
Python

# Copyright (C) 2025 Red Hat, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
# implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import functools
import random
import sys
import threading
import time
import futurist
from oslo_log import log as logging
from oslo_utils import excutils
from oslo_utils import reflection
from oslo_utils import timeutils
from oslo_service._i18n import _
LOG = logging.getLogger(__name__)
class LoopingCallDone(Exception):
"""Exception to break out and stop a LoopingCallBase.
The function passed to a looping call may raise this exception to
break out of the loop normally. An optional return value may be
provided; this value will be returned by LoopingCallBase.wait().
"""
def __init__(self, retvalue=True):
""":param retvalue: Value that LoopingCallBase.wait() should return."""
self.retvalue = retvalue
class LoopingCallTimeOut(Exception):
"""Exception raised when a LoopingCall times out."""
pass
class FutureEvent:
"""A simple event object that can carry a result or an exception."""
def __init__(self):
self._event = threading.Event()
self._result = None
self._exc_info = None
def send(self, result):
self._result = result
self._event.set()
def send_exception(self, exc_type, exc_value, tb):
self._exc_info = (exc_type, exc_value, tb)
self._event.set()
def wait(self, timeout=None):
flag = self._event.wait(timeout)
if not flag:
raise RuntimeError("Timed out waiting for event")
if self._exc_info:
exc_type, exc_value, tb = self._exc_info
raise exc_value.with_traceback(tb)
return self._result
def _safe_wrapper(f, kind, func_name):
"""Wrapper that calls the wrapped function and logs errors as needed."""
def func(*args, **kwargs):
try:
return f(*args, **kwargs)
except LoopingCallDone:
raise # Let the outer handler process this
except Exception:
LOG.error('%(kind)s %(func_name)r failed',
{'kind': kind, 'func_name': func_name},
exc_info=True)
return 0
return func
class LoopingCallBase:
_KIND = _("Unknown looping call")
_RUN_ONLY_ONE_MESSAGE = _(
"A looping call can only run one function at a time")
def __init__(self, f=None, *args, **kwargs):
self.args = args
self.kwargs = kwargs
self.f = f
self._future = None
self.done = None
self._abort = threading.Event() # When set, the loop stops
@property
def _running(self):
return not self._abort.is_set()
def stop(self):
if self._running:
self._abort.set()
def wait(self):
"""Wait for the looping call to complete and return its result."""
return self.done.wait()
def _on_done(self, future):
self._future = None
def _sleep(self, timeout):
# Instead of eventlet.sleep, we wait on the abort event for timeout
# seconds.
self._abort.wait(timeout)
def _start(self, idle_for, initial_delay=None, stop_on_exception=True):
"""Start the looping call.
:param idle_for: Callable taking two arguments (last result,
elapsed time) and returning how long to idle.
:param initial_delay: Delay (in seconds) before starting the
loop.
:param stop_on_exception: Whether to stop on exception.
:returns: A FutureEvent instance.
"""
if self._future is not None:
raise RuntimeError(self._RUN_ONLY_ONE_MESSAGE)
self.done = FutureEvent()
self._abort.clear()
def _run_loop():
kind = self._KIND
func_name = reflection.get_callable_name(self.f)
func = self.f if stop_on_exception else _safe_wrapper(self.f, kind,
func_name)
if initial_delay:
self._sleep(initial_delay)
try:
watch = timeutils.StopWatch()
while self._running:
watch.restart()
result = func(*self.args, **self.kwargs)
watch.stop()
if not self._running:
break
idle = idle_for(result, watch.elapsed())
LOG.debug(
'%(kind)s %(func_name)r sleeping for %(idle).02f'
' seconds',
{'func_name': func_name, 'idle': idle, 'kind': kind})
self._sleep(idle)
except LoopingCallDone as e:
self.done.send(e.retvalue)
except Exception:
exc_info = sys.exc_info()
try:
LOG.error('%(kind)s %(func_name)r failed',
{'kind': kind, 'func_name': func_name},
exc_info=exc_info)
self.done.send_exception(*exc_info)
finally:
del exc_info
return
else:
self.done.send(True)
# Use futurist's ThreadPoolExecutor to run the loop in a background
# thread.
executor = futurist.ThreadPoolExecutor(max_workers=1)
self._future = executor.submit(_run_loop)
self._future.add_done_callback(self._on_done)
return self.done
# NOTE: _elapsed() is a thin wrapper for StopWatch.elapsed()
def _elapsed(self, watch):
return watch.elapsed()
class FixedIntervalLoopingCall(LoopingCallBase):
"""A fixed interval looping call."""
_RUN_ONLY_ONE_MESSAGE = _(
"A fixed interval looping call can only run one function at a time")
_KIND = _('Fixed interval looping call')
def start(self, interval, initial_delay=None, stop_on_exception=True):
def _idle_for(result, elapsed):
delay = round(elapsed - interval, 2)
if delay > 0:
func_name = reflection.get_callable_name(self.f)
LOG.warning(
'Function %(func_name)r run outlasted interval by'
' %(delay).2f sec',
{'func_name': func_name, 'delay': delay})
return -delay if delay < 0 else 0
return self._start(_idle_for, initial_delay=initial_delay,
stop_on_exception=stop_on_exception)
class FixedIntervalWithTimeoutLoopingCall(LoopingCallBase):
"""A fixed interval looping call with timeout checking."""
_RUN_ONLY_ONE_MESSAGE = _(
"A fixed interval looping call with timeout checking"
" can only run one function at a time")
_KIND = _('Fixed interval looping call with timeout checking.')
def start(self, interval, initial_delay=None, stop_on_exception=True,
timeout=0):
start_time = time.time()
def _idle_for(result, elapsed):
delay = round(elapsed - interval, 2)
if delay > 0:
func_name = reflection.get_callable_name(self.f)
LOG.warning(
'Function %(func_name)r run outlasted interval by'
' %(delay).2f sec',
{'func_name': func_name, 'delay': delay})
elapsed_time = time.time() - start_time
if timeout > 0 and elapsed_time > timeout:
raise LoopingCallTimeOut(
_('Looping call timed out after %.02f seconds')
% elapsed_time)
return -delay if delay < 0 else 0
return self._start(_idle_for, initial_delay=initial_delay,
stop_on_exception=stop_on_exception)
class DynamicLoopingCall(LoopingCallBase):
"""A looping call which sleeps until the next known event.
The function called should return how long to sleep before being
called again.
"""
_RUN_ONLY_ONE_MESSAGE = _(
"A dynamic interval looping call can only run one function at a time")
_TASK_MISSING_SLEEP_VALUE_MESSAGE = _(
"A dynamic interval looping call should supply either an interval or"
" periodic_interval_max"
)
_KIND = _('Dynamic interval looping call')
def start(self, initial_delay=None, periodic_interval_max=None,
stop_on_exception=True):
def _idle_for(suggested_delay, elapsed):
delay = suggested_delay
if delay is None:
if periodic_interval_max is not None:
delay = periodic_interval_max
else:
raise RuntimeError(self._TASK_MISSING_SLEEP_VALUE_MESSAGE)
else:
if periodic_interval_max is not None:
delay = min(delay, periodic_interval_max)
return delay
return self._start(_idle_for, initial_delay=initial_delay,
stop_on_exception=stop_on_exception)
class BackOffLoopingCall(LoopingCallBase):
"""Run a method in a loop with backoff on error.
The provided function should return True (indicating success, which resets
the backoff interval), False (indicating an error, triggering a backoff),
or raise LoopingCallDone(retvalue=...) to quit the loop.
"""
_RNG = random.SystemRandom()
_KIND = _('Dynamic backoff interval looping call')
_RUN_ONLY_ONE_MESSAGE = _(
"A dynamic backoff interval looping call can only run one function at"
" a time")
def __init__(self, f=None, *args, **kwargs):
super().__init__(f=f, *args, **kwargs)
self._error_time = 0
self._interval = 1
def start(self, initial_delay=None, starting_interval=1, timeout=300,
max_interval=300, jitter=0.75, min_interval=0.001):
if self._future is not None:
raise RuntimeError(self._RUN_ONLY_ONE_MESSAGE)
# Reset state.
self._error_time = 0
self._interval = starting_interval
def _idle_for(success, _elapsed):
random_jitter = abs(self._RNG.gauss(jitter, 0.1))
if success:
# Reset error state on success.
self._interval = starting_interval
self._error_time = 0
return self._interval * random_jitter
else:
# Back off on error with jitter.
idle = max(self._interval * 2 * random_jitter, min_interval)
idle = min(idle, max_interval)
self._interval = max(self._interval * 2 * jitter, min_interval)
if timeout > 0 and self._error_time + idle > timeout:
raise LoopingCallTimeOut(
_('Looping call timed out after %.02f seconds') % (
self._error_time + idle))
self._error_time += idle
return idle
return self._start(_idle_for, initial_delay=initial_delay)
class RetryDecorator:
"""Decorator for retrying a function upon suggested exceptions.
The decorated function is retried for the given number of times,
with an incrementally increasing sleep time between retries. A max
sleep time may be set. If max_retry_count is -1, the function is
retried indefinitely until an exception is raised that is not in the
suggested exceptions.
"""
def __init__(self, max_retry_count=-1, inc_sleep_time=10,
max_sleep_time=60, exceptions=()):
"""Document parameters for retry behavior.
:param max_retry_count: Maximum number of retries for exceptions in
'exceptions'. -1 means retry indefinitely.
:param inc_sleep_time: Incremental sleep time (seconds) between
retries.
:param max_sleep_time: Maximum sleep time (seconds).
:param exceptions: A tuple of exception types to catch for retries.
"""
self._max_retry_count = max_retry_count
self._inc_sleep_time = inc_sleep_time
self._max_sleep_time = max_sleep_time
self._exceptions = exceptions
self._retry_count = 0
self._sleep_time = 0
def __call__(self, f):
func_name = reflection.get_callable_name(f)
def _func(*args, **kwargs):
try:
if self._retry_count:
LOG.debug(
"Invoking %(func_name)s; retry count is"
" %(retry_count)d.",
{'func_name': func_name,
'retry_count': self._retry_count})
result = f(*args, **kwargs)
except self._exceptions:
with excutils.save_and_reraise_exception() as ctxt:
LOG.debug(
"Exception in %(func_name)s occurred which is in the"
" retry list.",
{'func_name': func_name})
if (self._max_retry_count != -1 and
self._retry_count >= self._max_retry_count):
LOG.debug(
"Cannot retry %(func_name)s because retry count"
" (%(retry_count)d) reached max"
" (%(max_retry_count)d).",
{'retry_count': self._retry_count,
'max_retry_count': self._max_retry_count,
'func_name': func_name})
else:
ctxt.reraise = False
self._retry_count += 1
self._sleep_time += self._inc_sleep_time
return self._sleep_time
raise LoopingCallDone(result)
@functools.wraps(f)
def func(*args, **kwargs):
loop = DynamicLoopingCall(_func, *args, **kwargs)
evt = loop.start(periodic_interval_max=self._max_sleep_time)
LOG.debug("Waiting for function %s to return.", func_name)
return evt.wait()
return func