Source code for firexkit.task

import json
import re
import sys
import logging
import os
import textwrap
from collections import OrderedDict
import inspect
from datetime import datetime
from functools import partial
from typing import Callable, Iterable, Optional, Union, Any, Mapping, Sequence
from urllib.parse import urljoin
from copy import deepcopy
import dataclasses
import enum
import typing
import time

import pydantic

from celery.result import AsyncResult
from contextlib import contextmanager
from enum import Enum
from logging.handlers import WatchedFileHandler
from types import MethodType, MappingProxyType
from celery.app.task import Task
from celery.local import PromiseProxy
from celery.utils.log import get_task_logger, get_logger
import celery.signals

from firexkit.bag_of_goodies import BagOfGoodies, AutoInjectRegistry, AutoInjectSpec, AutoInject
from firexkit.argument_conversion import ConverterRegister
from firexkit.result import (
    get_tasks_names_from_results, wait_for_any_results,
    wait_on_async_results_and_maybe_raise, get_result_logging_name, ChainInterruptedException,
    ChainRevokedException, last_causing_chain_interrupted_exception,
    wait_for_running_tasks_from_results, WaitOnChainTimeoutError, get_results,
    get_task_name_from_result, first_non_chain_interrupted_exception, forget_chain_results,
    DYNAMIC_RETURN, ReturnsCodingException, FireXResults
)
from firexkit.resources import get_firex_css_filepath, get_firex_logo_filepath
from firexkit.firexkit_common import JINJA_ENV
from firexkit.chain import InjectArgs, SignatureX


# Suffix appended to a task's name when a plugin overrides it; the original
# implementation stays registered under '<name>_orig'.
REPLACEMENT_TASK_NAME_POSTFIX = '_orig'

# Backend (redis) keys used to track cross-task state for the whole run.
REDIS_DB_KEY_FOR_RESULTS_WITH_REPORTS = 'FIREX_RESULTS_WITH_REPORTS'
REDIS_DB_KEY_PREFIX_FOR_ENQUEUE_ONCE_UID = 'ENQUEUE_CHILD_ONCE_UID_'
REDIS_DB_KEY_PREFIX_FOR_ENQUEUE_ONCE_COUNT = 'ENQUEUE_CHILD_ONCE_COUNT_'
REDIS_DB_KEY_PREFIX_FOR_CACHE_ENABLED_UID = 'CACHE_ENABLED'

logger = get_task_logger(__name__)


@dataclasses.dataclass
class TaskEnqueueSpec:
    """Specification describing how a child signature should be enqueued.

    Attributes:
        signature: the signature to enqueue.
        inject_abog: when True, the parent's abog is injected into the child's args.
        enqueue_opts: optional extra keyword options for the enqueue call.
    """
    signature: SignatureX
    inject_abog: bool = True
    enqueue_opts: Optional[dict[str, Any]] = None
class NotInCache(Exception):
    """Raised when no cached-run entry exists in the backend for a cache key."""
    pass
class CacheResultNotPopulatedYetInRedis(NotInCache):
    """Raised when a cache entry exists but its result is not yet stored in redis."""
    pass
def _nop():
    """Placeholder callable whose empty signature seeds an empty BagOfGoodies."""
    pass


def _empty_bog() -> BagOfGoodies:
    """Return a BagOfGoodies with no supplied args, built from an empty signature."""
    return BagOfGoodies(inspect.signature(_nop), tuple(), {})
@dataclasses.dataclass
class TaskContext:
    """Per-invocation state held by a running FireXTask.

    Attributes:
        bog: the BagOfGoodies holding this invocation's args (defaults to empty).
        flame_configs: flame data configs for this run (mutated for collapse ops).
        enqueued_children: AsyncResult -> per-child state dict for enqueued children.
        _auto_in_reg: lazily-built AutoInjectRegistry cache.
        _pause_tasks: lazily-fetched PauseTasks configuration cache.
    """
    # NOTE: the original declared 'bog' twice (first without a default, then
    # again with a default_factory); a single declaration is equivalent and
    # keeps 'bog' as the first constructor argument.
    bog: BagOfGoodies = dataclasses.field(default_factory=_empty_bog)
    flame_configs: dict = dataclasses.field(default_factory=dict)
    enqueued_children: dict[AsyncResult, dict] = dataclasses.field(default_factory=dict)
    _auto_in_reg: Optional[AutoInjectRegistry] = None
    _pause_tasks: Optional['PauseTasks'] = None

    def auto_inject_reg(self) -> AutoInjectRegistry:
        """Lazily create and cache the AutoInjectRegistry derived from the bog."""
        if self._auto_in_reg is None:
            self._auto_in_reg = self.bog.get_auto_inject_registry()
        return self._auto_in_reg

    def pause_tasks(self) -> 'PauseTasks':
        """Lazily fetch (and cache) the PauseTasks config via auto-injection,
        defaulting to an empty, no-email configuration."""
        if self._pause_tasks is None:
            self._pause_tasks: PauseTasks = self.auto_inject_reg().get(
                PauseTasks.PAUSE_TASKS_ABOG_KEY,
                PauseTasks({}, False),
            )
        return self._pause_tasks
class PendingChildStrategy(Enum):
    """
    Available strategies for handling remaining pending child tasks upon successful
    completion of the parent microservice.
    """

    # NOTE: the trailing ', "Default"' makes this member's value the tuple
    # (0, "Default"); compare members by identity/name, not by value.
    Block = 0, "Default"
    Revoke = 1
    Continue = 2
class IllegalTaskNameException(Exception):
    """Raised when a task name collides with the plugin-override naming scheme."""
    pass
def create_collapse_ops(flex_collapse_ops_spec):
    """Normalize a flexible flame-collapse spec into a list of operation dicts.

    Accepts three input shapes:
        list -> returned as-is (assumed already canonical).
        dict -> keys are task names (str) or compiled regexes; values are a
                target, a list of targets, or a dict merged into the op.
                Entries that yield no 'targets' are dropped.
        str  -> a single op targeting that value.

    :return: list of operation dicts, each containing at least 'targets'.
    """
    if isinstance(flex_collapse_ops_spec, list):
        return flex_collapse_ops_spec
    result_ops = []
    if isinstance(flex_collapse_ops_spec, dict):
        for k, v in flex_collapse_ops_spec.items():
            op = {}
            if isinstance(k, str):
                op['relative_to_nodes'] = {'type': 'task_name', 'value': k}
            elif isinstance(k, re.Pattern):
                # re.Pattern supports isinstance directly since 3.8;
                # the old issubclass(type(k), typing.Pattern) form is deprecated.
                op['relative_to_nodes'] = {'type': 'task_name_regex', 'value': k.pattern}

            if isinstance(v, str):
                op['targets'] = [v]
            elif isinstance(v, list):
                op['targets'] = v
            elif isinstance(v, dict):
                # take targets, operation from value.
                op.update(v)

            if 'targets' in op:
                result_ops.append(op)
            else:
                # TODO: fail or ignore malformed specs?
                pass
    elif isinstance(flex_collapse_ops_spec, str):
        result_ops.append({'targets': [flex_collapse_ops_spec]})
    return result_ops
def expand_self_op():
    """Return the flame display operation that expands the current ('self') node."""
    return dict(operation='expand', targets=['self'])
# Flame key under which collapse/expand display operations are stored.
FLAME_COLLAPSE_KEY = '_default_display'
def flame_collapse_formatter(ops, task):
    """Fill each collapse operation with defaults anchored to the running task.

    Operations missing a list-valued 'targets' are silently dropped; explicit
    keys in an op override the defaults.
    """
    task_node = {'type': 'task_uuid', 'value': task.request.id}

    def _with_defaults(op):
        filled = {
            'relative_to_nodes': dict(task_node),
            'source_node': dict(task_node),
            'operation': 'collapse',
        }
        filled.update(op)
        return filled

    return [_with_defaults(op) for op in ops if isinstance(op.get('targets'), list)]
def flame_collapse(flex_collapse_ops):
    """Decorator factory: attach flame collapse display operations to a task.

    The flexible spec is normalized once at decoration time; the formatter is
    bound so the ops can be anchored to the running task at execution time.
    """
    static_ops = create_collapse_ops(flex_collapse_ops)
    return flame(FLAME_COLLAPSE_KEY, flame_collapse_formatter, data_type='object', bind=True,
                 on_next=True, on_next_args=[static_ops], decorator_name=flame_collapse.__name__)
def _default_flame_formatter(data): if data is None: return None if not isinstance(data, str): try: return json.dumps(data) except TypeError: return str(data) return data
def create_flame_config(existing_configs, formatter=_default_flame_formatter,
                        data_type='html', bind=False, on_next=False, on_next_args=()):
    """Build a single flame-data config dict, ordered after all existing configs."""
    # New config sorts after every config already present (order starts at 0).
    next_order = 1 + max((cfg['order'] for cfg in existing_configs), default=-1)
    return dict(
        formatter=formatter,
        data_type=data_type,
        bind=bind,
        on_next=on_next,
        on_next_args=on_next_args,
        order=next_order,
    )
def flame(flame_key=None, formatter=_default_flame_formatter, data_type='html', bind=False,
          on_next=False, on_next_args=(), decorator_name='flame'):
    """Decorator factory: register a flame-data config under flame_key on the service.

    Must be applied to the plain function, i.e. listed after @app.task so it
    runs before the function becomes a PromiseProxy.
    """
    def decorator(func):
        if type(func) is PromiseProxy:
            raise Exception(f"@{decorator_name} must be applied to a function (after @app.task) on {func.__name__}")
        undecorated = undecorate_func(func)
        configs = getattr(undecorated, 'flame_data_configs', None)
        if configs is None:
            # First flame decorator on this service: create the ordered store.
            configs = undecorated.flame_data_configs = OrderedDict()
        configs[flame_key] = create_flame_config(
            configs.values(), formatter, data_type, bind, on_next, on_next_args)
        return func
    return decorator
def _set_taskid_in_db_key(result: AsyncResult, db, db_key):
    """Record a task/result id in the backend under db_key."""
    db.set(db_key, result.id)
    logger.debug(f'Key {db_key} set to {result.id}')
def get_cache_enabled_uid_dbkey(cache_key_info: str) -> str:
    """Backend key that holds the cached-run uid for the given cache key info."""
    return REDIS_DB_KEY_PREFIX_FOR_CACHE_ENABLED_UID + cache_key_info
def get_enqueue_child_once_uid_dbkey(enqueue_once_key: str) -> str:
    """Backend key that holds the uid of the child enqueued under enqueue_once_key."""
    return REDIS_DB_KEY_PREFIX_FOR_ENQUEUE_ONCE_UID + enqueue_once_key
def get_enqueue_child_once_count_dbkey(enqueue_once_key: str) -> str:
    """Backend key that holds the enqueue count for the given enqueue_once key."""
    return REDIS_DB_KEY_PREFIX_FOR_ENQUEUE_ONCE_COUNT + enqueue_once_key
def get_current_enqueue_child_once_uid_dbkeys(db) -> list[str]:
    """List every enqueue-once uid key currently present in the backend."""
    wildcard_key = get_enqueue_child_once_uid_dbkey('*')
    return db.client.keys(wildcard_key)
def get_current_cache_enabled_uid_dbkeys(db) -> list[str]:
    """List every cache-enabled uid key currently present in the backend."""
    wildcard_key = get_cache_enabled_uid_dbkey('*')
    return db.client.keys(wildcard_key)
def get_current_enqueue_child_once_uids(db) -> set[str]:
    """Returns a set of all task/result ids that were executed with enqueue_once"""
    # Find every enqueue-once key, then fetch the ids those keys point at.
    uid_keys = get_current_enqueue_child_once_uid_dbkeys(db)
    return {raw.decode() for raw in db.mget(uid_keys)}
def get_current_cache_enabled_uids(db) -> set[str]:
    """Returns a set of all task/result ids whose tasks were cache-enabled"""
    # Find every cache-enabled key, then fetch the ids those keys point at.
    uid_keys = get_current_cache_enabled_uid_dbkeys(db)
    return {raw.decode() for raw in db.mget(uid_keys)}
def add_task_result_with_report_to_db(db, result_id: str):
    """Append task id to the list of tasks with reports (e.g. tasks decorated with @email)"""
    db.client.rpush(REDIS_DB_KEY_FOR_RESULTS_WITH_REPORTS, result_id)
def get_current_reports_uids(db) -> set[str]:
    """Return the list of task/results ids for all tasks with reports (e.g. @email) executed so far"""
    raw_ids = db.client.lrange(REDIS_DB_KEY_FOR_RESULTS_WITH_REPORTS, 0, -1)
    return {raw.decode() for raw in raw_ids}
class FireXTask(Task):
    """
    Task object that facilitates passing of arguments and return values from one task to another, to be used in chains
    """
    DYNAMIC_RETURN = DYNAMIC_RETURN  # prevent clients from needing to know about bag_of_goodes module.
    AutoInject = AutoInject

    def __init__(self):
        # Guard against task names that collide with the plugin-override postfix.
        check_name_for_override_posfix = getattr(self, 'check_name_for_override_posfix', True)
        if check_name_for_override_posfix and self.name and self.name.endswith(REPLACEMENT_TASK_NAME_POSTFIX):
            raise IllegalTaskNameException(f'Task names should never end with {REPLACEMENT_TASK_NAME_POSTFIX!r}')

        self.undecorated = undecorate(self)
        self.sig = inspect.signature(self.run)

        # Return keys may come from the @returns decorator or from the task's
        # 'returns' attribute, but never both.
        _task_return_keys = self._get_task_return_keys()
        _decorated_return_keys = getattr(self.undecorated, "_decorated_return_keys", None)
        if _decorated_return_keys and _task_return_keys:
            raise ReturnsCodingException(f"You can't specify both a @returns decorator and a returns in the app task for {self.name}")
        self._return_keys: Optional[tuple[str, ...]] = _decorated_return_keys or _task_return_keys

        self._lagging_children_strategy = get_attr_unwrapped(self, 'pending_child_strategy', PendingChildStrategy.Block)

        super(FireXTask, self).__init__()

        # Lazily-populated caches / per-worker logging state.
        self._in_required: Optional[set[str]] = None
        self._in_optional: Optional[dict[str, Any]] = None
        self._logs_dir_for_worker = None
        self._file_logging_dir_path = None
        self._task_logging_dirpath = None
        self._temp_loghandlers = None
        self.code_filepath = self.get_module_file_location()
        self._from_plugin = False
        # Fresh (empty-args) context; replaced per invocation by _task_context.
        self.context: TaskContext = TaskContext(BagOfGoodies(self.sig, tuple(), {}))
        self.name: str

    @property
    def return_keys(self) -> tuple[str, ...]:
        # Empty tuple when neither decorator nor attribute supplied return keys.
        return self._return_keys or tuple()
[docs] def get_overridden_task(self) -> 'FireXTask': if not self.is_overriding_task(): raise TypeError(f'{self.name} does not override a task') assert self.orig return self.orig
    @property
    def root_orig(self) -> 'FireXTask':
        """Return the very original `Task` that this `Task` had overridden.
        If this task has been overridden multiple times, this will return the very first/original task.
        Return `self` if the task was not overridden"""
        if (
                orig_task := getattr(self, "orig", None)
        ):
            # Recurse down the override chain until a task with no 'orig' is found.
            return orig_task.root_orig
        return self
[docs] def is_overriding_task(self) -> bool: return self.root_orig != self
    def apply_async(self, *args, **kwargs):
        """Enqueue via Celery, temporarily serializing under the original task name."""
        original_name = self.name

        if self.from_plugin and not original_name.endswith(REPLACEMENT_TASK_NAME_POSTFIX):
            # If the task is overridden, and is not an intermediate override, then
            # let's use the original name for serialization, in case that
            # override name isn't available in the execution context.
            # This can obviously be dangerous (but a risk we're deliberately taking)
            # since we bind the args/kwargs/runtime options with the overridden service
            # but might end up executing in a context that doesn't have it.
            self.name = self.root_orig.name_without_orig
        try:
            res = super(FireXTask, self).apply_async(*args, **kwargs)
        finally:
            # Restore the original name
            self.name = original_name
        return res
    def signature(self, *args, **kwargs):
        """Build a signature for the currently-registered task of this name."""
        # We need to lookup the task, in case it was over-ridden by a plugin
        try:
            new_self = self.app.tasks[self.name]
        except Exception:
            # TODO: WTH
            # Some caching issue prevent tests from running
            # These tests should really run in forked processes (or use Celery PyTest fixtures)
            # Otherwise, seems that everything is global
            new_self = self.app.tasks[self.name]

        # Get the signature from the new_self
        return super(FireXTask, new_self).signature(*args, **kwargs)
    @contextmanager
    def _task_context(self, args: tuple[Any, ...], kwargs: dict[str, Any]):
        """Install a fresh TaskContext for the duration of one task invocation."""
        try:
            self.context = self.initialize_context(
                # Flame configs need to be on self.context b/c they write to flame_data_configs[k]['on_next'] for collapse ops.
                # Might make more sense to rework that to avoid flame data on context.
                flame_configs=self._get_task_flame_configs(),
                # Organise the input args by creating a BagOfGoodies
                bog=BagOfGoodies(self.sig, args, kwargs)
            )
            yield
        finally:
            # restore empty context to avoid pointless defensive coding.
            self.context = TaskContext(BagOfGoodies(self.sig, tuple(), {}))

    @property
    def from_plugin(self):
        # True when this task implementation was supplied by a plugin override.
        return self._from_plugin

    @property
    def task_label(self) -> str:
        """Returns a label for this task

        Examples:
            8345379a-e536-4566-b5c9-3d515ec5936a
            8345379a-e536-4566-b5c9-3d515ec5936a_2 (if it was the second retry)
            microservices.testsuites_tasks.CreateWorkerConfigFromTestsuites (if there was no request id yet)
        """
        label = str(self.request.id) if self.request.id else self.name
        label += '_%d' % self.request.retries if self.request.retries >= 1 else ''
        return label

    @property
    def request_soft_time_limit(self):
        # request.timelimit is (hard, soft); index 1 is the soft limit.
        return self.request.timelimit[1]

    @from_plugin.setter
    def from_plugin(self, value):
        self._from_plugin = value
[docs] def initialize_context(self, flame_configs: dict, bog: BagOfGoodies) -> TaskContext: return TaskContext( flame_configs=flame_configs, bog=bog, )
[docs] def get_module_file_location(self): return sys.modules[self.__module__].__file__
[docs] @classmethod def is_dynamic_return(cls, value: str) -> bool: return hasattr(value, 'startswith') and value.startswith(cls.DYNAMIC_RETURN)
    def _get_task_return_keys(self) -> Optional[tuple[str, ...]]:
        """Read and validate the task's 'returns' attribute, normalized to a tuple (or None)."""
        task_return_keys = get_attr_unwrapped(self, 'returns', None)
        if task_return_keys is not None:
            if isinstance(task_return_keys, str):
                task_return_keys = (task_return_keys, )

            # Dynamic-return placeholders may repeat; explicit keys must be unique.
            explicit_keys = [k for k in task_return_keys if not self.is_dynamic_return(k)]
            if len(explicit_keys) != len(set(explicit_keys)):
                raise ReturnsCodingException(f"{self.name} has duplicate explicit return keys")

            if not isinstance(task_return_keys, tuple):
                task_return_keys = tuple(task_return_keys)
        return task_return_keys
    def run(self, *args, **kwargs):
        """The body of the task executed by workers."""
        # Abstract by convention: concrete services supply run via @app.task.
        raise NotImplementedError('Tasks must define the run method.')
[docs] @staticmethod def strip_orig_from_name(task_name): return re.sub(f"({REPLACEMENT_TASK_NAME_POSTFIX})*$", "", task_name)
[docs] @staticmethod def get_short_name(task_name): # Task name of first task in chain. (I.E. 'task1' in module1.task1|module2.task2) return task_name.split('|')[0].split('.')[-1]
[docs] @classmethod def get_short_name_without_orig(cls, task_name): return cls.strip_orig_from_name(cls.get_short_name(task_name))
@property def name_without_orig(self): return self.strip_orig_from_name(self.name) @property def short_name(self): return self.get_short_name(self.name) @property def short_name_without_orig(self): return self.get_short_name_without_orig(self.name) @property def called_as_orig(self): return True if self.name.endswith(REPLACEMENT_TASK_NAME_POSTFIX) else False
    def has_report_meta(self) -> bool:
        """Does this task generate a report (e.g. decorated with @email)?"""
        return hasattr(self, 'report_meta')
[docs] def add_task_result_with_report_to_db(self): """Maintain a list in the backend of all executed tasks that will generate reports""" return add_task_result_with_report_to_db(self.app.backend, self.request.id)
    def pre_task_run(self, extra_events: Optional[dict] = None):
        """
        Overrideable method to allow subclasses to do something with the
        BagOfGoodies before returning the results
        """
        # Send a custom task-started-info event with essential meta-data
        # and a task-args event with the args
        if not self.request.called_directly:
            if self.has_report_meta():
                # If the task generates a report, append the task id
                # to the list in the backend of all executed tasks that generate reports
                self.add_task_result_with_report_to_db()

            self.send_event(
                'task-started-info',
                called_as_orig=self.called_as_orig,
                long_name=self.name_without_orig,
                log_filepath=self.task_log_url,
                from_plugin=self.from_plugin,
                code_filepath=self.code_filepath,
                retries=self.request.retries,
                task_parent_id=self.request.parent_id,
                **(extra_events or {}),
            )
            self.send_event(
                'task-args',
                firex_bound_args=convert_to_serializable(self.bound_args),
                firex_default_bound_args=convert_to_serializable(self.default_bound_args),
            )
            self.send_flame(self.abog)

        # Print the pre-call header
        self._print_precall_header()

        self._log_soft_time_limit_override_if_applicable()
    def _log_soft_time_limit_override_if_applicable(self):
        # Log when the enqueue-time soft time limit differs from the task's default.
        if not self.request.called_directly:
            if self.soft_time_limit != self.request_soft_time_limit:
                logger.debug(f'This task default soft_time_limit of '
                             f'{self.soft_time_limit}{"s" if self.soft_time_limit is not None else ""} '
                             f'was over-ridden to {self.request_soft_time_limit}s')
            elif self.soft_time_limit is not None:
                logger.debug(f'This task soft_time_limit is {self.soft_time_limit}s')

    def _print_precall_header(self):
        # Build a numbered list of supplied args followed by unsupplied defaults,
        # then log a STARTED banner for this invocation.
        n = 1
        content = ''
        args_list = []
        for postfix, args in zip(['', ' (default)'], [self.bound_args, self.default_bound_args]):
            for k, v in (args or {}).items():
                args_list.append(' %d. %s: %r%s' % (n, k, v, postfix))
                n += 1
        if args_list:
            content = 'ARGUMENTS\n' + '\n'.join(args_list)
        task_name = self.name
        if self.from_plugin:
            task_name += ' (PLUGIN)'
        logger.debug(
            banner(f'STARTED: {task_name}', content=content, length=100),
            extra={'label': self.task_label, 'span_class': 'task_started'},
        )
    def print_postcall_header(self, result):
        """Log a COMPLETED banner including the task's returned values."""
        content = ''
        results_list = []
        if result:
            if isinstance(result, dict):
                # Number each returned key/value pair.
                n = 1
                for k, v in result.items():
                    results_list.append(' %d. %s: %r' % (n, k, v))
                    n += 1
            else:
                results_list.append(f' {result!r}')
        if results_list:
            content = 'RETURNS\n' + '\n'.join(results_list)
        logger.debug(banner('COMPLETED: %s' % self.name, ch='*', content=content, length=100),
                     extra={'span_class': 'task_completed'})
    def __call__(self, *args, **kwargs) -> dict[str, Any]:
        """
        This method should not be overridden since it provides the context (i.e., run state).
        Classes extending FireX should override the _call.
        """
        with self._task_context(args, kwargs):
            return self._call(*args, **kwargs)

    def _call(self, *args, **kwargs) -> dict[str, Any]:
        """Run converters + the service, wait on / revoke children per strategy,
        and manage the per-task log file handler."""
        if not self.request.called_directly:
            self.add_task_logfile_handler()
        try:
            converted_result = self._process_arguments_and_run(*args, **kwargs)

            # Block strategy: implicitly wait for enqueued children to finish,
            # but never fail the parent because of that implicit wait.
            if self._lagging_children_strategy is PendingChildStrategy.Block:
                try:
                    self.wait_for_children()
                except Exception as e:
                    logger.debug("The following exception was thrown (and caught) when wait_for_children was "
                                 "implicitly called by this task's base class:\n" + str(e))

            return converted_result
        except Exception as e:
            # handle_exception logs and (by default) re-raises.
            self.handle_exception(e)
        finally:
            try:
                if self._lagging_children_strategy is not PendingChildStrategy.Continue:
                    self.revoke_nonready_children()
            finally:
                self.remove_task_logfile_handler()
    def handle_exception(self, e, logging_extra: Optional[dict] = None):
        """Log the failure (emitting a task-exception-cause event for chain failures) and re-raise."""
        extra = {'span_class': 'exception'} | (logging_extra or {})
        if isinstance(e, ChainInterruptedException) or isinstance(e, ChainRevokedException):
            try:
                # Find the task at the root of the chain failure, if any.
                causing_e = last_causing_chain_interrupted_exception(e)
                exception_cause_uuid = causing_e.task_id
            except AttributeError:
                pass
            else:
                if exception_cause_uuid:
                    self.send_event('task-exception-cause', exception_cause_uuid=exception_cause_uuid)
        mssg = f'{type(e).__name__}'
        exception_string = str(e)
        if exception_string:
            mssg += f': {exception_string}'
        logger.error(mssg, exc_info=e, extra=extra)
        raise e
    def _process_result(
            self,
            result: dict[str, Any],
            extra_events: Optional[dict] = None,
    ) -> dict[str, Any]:
        """Run post-converters over the result, emit result events, and return
        the indirect-resolved converted return args."""
        post_run_return_args = self.context.bog.all_supplied_args() | result

        # run any post converters attached to this task
        converted_return_args = ConverterRegister.task_convert(
            self.name,
            pre_task=False,
            **BagOfGoodies.resolve_indirect(post_run_return_args)
        )
        indirect_resolved_converted_return_args = BagOfGoodies.resolve_indirect(converted_return_args)

        converted_task_results = {
            k: v for k, v in indirect_resolved_converted_return_args.items()
            if (
                k in result  # only results for service, not all supplied args
                and k not in BagOfGoodies.infra_return_keys()  # hide infra keys
            )
        }

        # Print the post-call header
        self.print_postcall_header(converted_task_results)

        # Send a custom task-succeeded event with the results
        if not self.request.called_directly:
            self.send_event(
                'task-results',
                firex_result=convert_to_serializable(converted_task_results),
                **(extra_events or {}),
            )
            self.send_flame(indirect_resolved_converted_return_args)

        return indirect_resolved_converted_return_args

    def _get_cache_key(self):
        # Need a string hash of name + all_args
        return get_cache_enabled_uid_dbkey(str((self.name,) + tuple(sorted(self.all_args.items()))))

    def _cache_get(self, cache_key):
        """Return the uuid of a previously-cached run, or raise NotInCache."""
        cached_uuid = self.backend.get(cache_key)
        if cached_uuid is None:
            raise NotInCache()
        cached_uuid = cached_uuid.decode()
        logger.info(f'[Caching] found entry for key {cache_key!r} at {cached_uuid!r}')
        return cached_uuid

    def _cache_set(self, cache_key, uuid):
        # We need to just store a reference to the uuid (no need to store the result again)
        logger.debug(f'[Caching] storing entry for key {cache_key!r} -> {uuid!r}')
        self.backend.set(cache_key, uuid)

    @classmethod
    def _retrieve_result_from_backend(
            cls,
            cached_uuid,
            secs_to_wait_for_cached_result: int = 3,
    ) -> dict[str, Any]:
        """Poll the backend for cached_uuid's result, waiting briefly for it to
        be populated; raise CacheResultNotPopulatedYetInRedis on timeout."""
        # Retrieve the result of the original cached uuid from the backend
        logger.info(f'Retrieving result for {cached_uuid}; might take up to '
                    f'{secs_to_wait_for_cached_result} seconds.')
        loop_start_time = current_time = time.time()
        while (current_time - loop_start_time) < secs_to_wait_for_cached_result:
            result: dict[str, Any] = cls.app.backend.get_result(cached_uuid)
            if set(result.keys()) != {'hostname', 'pid'}:
                # When the result is not populated, we get a dict back with these two keys
                break  # --< We're done
            else:
                logger.debug('Result not populated yet!')
                time.sleep(0.1)
                current_time = time.time()
        else:
            raise CacheResultNotPopulatedYetInRedis(f'result for {cached_uuid} not populated '
                                                    f'in redis after {secs_to_wait_for_cached_result}s')
        return result

    @classmethod
    def _run_from_cache(cls, cached_uuid) -> dict[str, Any]:
        """Reconstruct a task's return dict from a previously-cached run's stored result."""
        result = cls._retrieve_result_from_backend(cached_uuid)
        # Keep only the declared return keys, plus the return-keys marker itself.
        cached_result_return_keys = result.get('__task_return_keys', ()) + ('__task_return_keys',)
        return {
            k: v for k, v in result.items()
            if k in cached_result_return_keys
        }

    @property
    def default_use_cache(self):
        # The task-declared 'use_cache' attribute, if any (None when undeclared).
        return getattr(self, 'use_cache', None)
    def is_cache_enabled(self):
        """Whether caching applies to this run; an enqueue-time 'use_cache'
        request property overrides the task's default."""
        use_cache_value = self.default_use_cache
        if not self.request.called_directly:
            try:
                request_use_cache = self.request.properties['use_cache']
            except KeyError:
                pass
            else:
                if request_use_cache is not None:
                    if request_use_cache != self.default_use_cache:
                        logger.debug(f'use_cache default value of {self.default_use_cache!r} for task {self.name!r} '
                                     f'was overridden by enqueue to {request_use_cache!r}')
                    use_cache_value = request_use_cache
        return bool(use_cache_value)
    def _real_call_and_cache_set(self, cache_key):
        # Execute for real, then record this run's id as the cached entry.
        result = self.real_call()
        self._cache_set(cache_key, self.request.id)
        return result
    def cache_call(self) -> dict[str, Any]:
        """Return a previously-cached result when available; otherwise run for
        real and record this run's id under the cache key."""
        cache_key = self._get_cache_key()
        try:
            cached_uuid = self._cache_get(cache_key)
        except NotInCache:
            logger.debug(f'[Caching] No entry found for key {cache_key!r}')
            return self._real_call_and_cache_set(cache_key)
        else:
            try:
                result = self._run_from_cache(cached_uuid)
            except CacheResultNotPopulatedYetInRedis:
                # The cached run's result isn't stored yet; don't wait forever.
                logger.debug('[Caching] Cache result not populated yet in Redis. '
                             'Reverting to a real call')
                return self._real_call_and_cache_set(cache_key)
            else:
                return self._process_result(
                    result,
                    extra_events={'cached_result_from': cached_uuid})
    def _find_applicable_overriding_return_keys(
            self,
            results_tuple: tuple[Any, ...],
    ) -> tuple[str, ...]:
        """Walk the override chain to find the return keys matching the actual result arity."""
        result_count = len(results_tuple)
        if (
            # integration tests rely on no validation for implicit dynamic returns :/
            # so assume DYNAMIC_RETURN if it looks like it
            self._return_keys is None
            and result_count == 1
            and isinstance(results_tuple[0], dict)
        ):
            return (DYNAMIC_RETURN,)

        if (
            not self.is_overriding_task()  # base case in recursion
            # lots of IT have plugins that violate the overridden task returns contract
            # by returning nothing, which is bad but needs to be accommodated.
            # TODO: "strict" should disallow this.
            or result_count == len(self._return_keys or [])
        ):
            return self.return_keys

        # return overridden result.
        return self.get_overridden_task()._find_applicable_overriding_return_keys(results_tuple)
    def real_call(self) -> dict[str, Any]:
        """Execute the service's run method and post-process its raw return value."""
        # this is the raw result from the service's .run method,
        # prior to all FireX processing.
        _call_run_result: Any = super(FireXTask, self).__call__(
            *self.context.bog.args,
            **self.context.bog.kwargs)

        results_tuple = FireXResults.task_returns_to_tuple(self.return_keys, _call_run_result)
        # Overriding (plugin) tasks may declare different return keys than the
        # task they replace; pick the set matching the actual result arity.
        applicable_return_keys = self._find_applicable_overriding_return_keys(results_tuple)

        return self._process_result(
            FireXResults.convert_result_tuple_to_dict(applicable_return_keys, results_tuple)
        )
[docs] def final_call(self) -> dict[str, Any]: if self.is_cache_enabled(): return self.cache_call() else: return self.real_call()
    def _process_arguments_and_run(self, *args, **kwargs) -> dict[str, Any]:
        """Apply pre-converters, honour requested pause points, then run via final_call()."""
        # run any "pre" converters attached to this task
        self.context.bog.update(
            ConverterRegister.task_convert(
                task_name=self.name,
                pre_task=True,
                **self.context.bog.get_public_supplied_args())
        )

        if not self.request.called_directly:
            self._pause_if_point_requested(_PausePoints.PAUSE_BEFORE)

        # give sub-classes a chance to do something with the args
        self.pre_task_run()

        try:
            return self.final_call()
        except Exception:
            self._pause_if_point_requested(_PausePoints.PAUSE_ON_FAILURE)
            raise
        finally:
            self._pause_if_point_requested(_PausePoints.PAUSE_AFTER)

    def _pause_if_point_requested(self, p: '_PausePoints'):
        """If a pause was requested for this task at point p, enqueue the Pause
        task (blocking) with the pause parameters merged over the abog."""
        pause_req = self.context.pause_tasks().pause_point_requested(self.short_name, p)
        if pause_req:
            pause_task_name = self.app.conf.get("pause_task") or 'firexapp.tasks.core_tasks.Pause'
            pause_task = self.app.tasks[pause_task_name]
            self.enqueue_child(
                pause_task.s(
                    **(
                        dict(
                            pause_hours=pause_req.pause_hours,
                            pause_point=pause_req.pause_point,
                            send_pause_email_notification=self.context.pause_tasks().send_pause_email_notification,
                        ) | self.abog
                    )
                ),
                block=True,
                raise_exception_on_failure=False,
            )
            # Reset the task's start time so the paused duration is excluded.
            # NOTE(review): placement inside the pause branch inferred from the
            # original flattened source — confirm against upstream.
            _set_task_start_time(self, force=True)
    def retry(self, *args, **kwargs):
        """Celery retry with extra logging about the retry attempt count."""
        # Adds some logging to the original task retry
        if not self.request.called_directly:
            if self.request.retries == self.max_retries:
                logger.error(f'{self.short_name} failed all {self.max_retries} retry attempts')
            else:
                logger.warning(f'{self.short_name} failed and retrying {self.request.retries+1}/{self.max_retries}')
        super(FireXTask, self).retry(*args, **kwargs)
    @property
    def required_args(self) -> list[str]:
        """
        :return: list of required arguments to the microservice.
        """
        if self._in_required is None:
            # Cached on first access from the bog's signature.
            self._in_required = self.context.bog.get_required_arg_names()
        return list(self._in_required)

    @property
    def optional_args(self) -> dict:
        """
        :return: dict of optional arguments to the microservice, and their values.
        """
        if self._in_optional is None:
            self._in_optional = self.context.bog.get_optional_args_to_default_values()
        return dict(self._in_optional)

    @property
    def args(self) -> tuple[Any, ...]:
        # Positional args as currently held by the bag-of-goodies.
        return self.context.bog.args

    @property
    def kwargs(self) -> dict[str, Any]:
        # Keyword args as currently held by the bag-of-goodies.
        return self.context.bog.kwargs

    @property
    def bound_args(self) -> dict[str, Any]:
        # Supplied args bound to the run() signature's parameter names.
        return self.sig.bind_partial(
            *self.context.bog.args,
            **self.context.bog.kwargs,
        ).arguments

    @property
    def default_bound_args(self) -> dict[str, Any]:
        # Signature defaults for parameters the caller did not supply.
        return self.context.bog.get_unsupplied_default_args()
[docs] def map_args(self, *args, **kwargs) -> dict: return BagOfGoodies( self.sig, args, kwargs, ).get_accepted_supplied_and_default_args()
    @property
    def all_args(self) -> MappingProxyType:
        """Read-only view of bound args merged over unsupplied defaults."""
        return MappingProxyType(self.bound_args | self.default_bound_args)

    @property
    def abog(self) -> MappingProxyType[str, Any]:
        """Unsupplied defaults overlaid with publicly supplied args (the task's abog).

        NOTE(review): despite the annotation, this currently returns a plain dict.
        """
        # TODO: actually change to MappingProxyType? DictWillNotAllowWrites was in place for years.
        return self.default_bound_args | self.context.bog.get_public_supplied_args()

    def _get_infra_abog(self) -> MappingProxyType[str, Any]:
        # Like abog, but includes *all* supplied args (not just public ones).
        return self.default_bound_args | self.context.bog.all_supplied_args()

    def _get_auto_injected_arg(self, arg_name: str):
        # Look up an auto-injected value by name from the BoG's registry.
        return self.context.auto_inject_reg().get(arg_name)

    @property
    def uid(self):
        # services should always declare "uid: AutoInject[Uid]" as an arg to automatically receive
        # a Uid, but since we have this legacy mechanism, use auto_inject_reg
        # to always supply the Uid
        return self._get_auto_injected_arg('uid')

    #######################
    # Enqueuing child tasks

    # Keys/values used to track per-child state in context.enqueued_children.
    _STATE_KEY = 'state'
    _PENDING = 'pending'
    _UNBLOCKED = 'unblocked'

    @property
    def enqueued_children(self) -> list[AsyncResult]:
        """All AsyncResults this task has enqueued, in insertion order."""
        return list(self.context.enqueued_children.keys())

    @property
    def pending_enqueued_children(self):
        """Enqueued children still in the 'pending' (not yet unblocked) state."""
        return [child for child, result in self.context.enqueued_children.items()
                if result.get(self._STATE_KEY) == self._PENDING]

    @property
    def nonready_enqueued_children(self):
        """Enqueued children whose results are not yet ready."""
        return [child for child in self.context.enqueued_children if not child.ready()]

    def _add_enqueued_child(self, child_result: AsyncResult):
        # Start tracking a child with no state yet; no-op if already tracked.
        if child_result not in self.context.enqueued_children:
            self.context.enqueued_children[child_result] = {}

    def _remove_enqueued_child(self, child_result: AsyncResult):
        # Stop tracking a child (e.g. after its results were forgotten).
        if child_result in self.context.enqueued_children:
            del(self.context.enqueued_children[child_result])

    def _update_child_state(self, child_result: AsyncResult, state: str):
        # Set the tracked state of a child, registering it first if needed.
        if child_result not in self.context.enqueued_children:
            self._add_enqueued_child(child_result)
        self.context.enqueued_children[child_result][self._STATE_KEY] = state
[docs] def wait_for_any_children(self, pending_only=True, **kwargs): """Wait for any of the enqueued child tasks to run and complete""" child_results = self.pending_enqueued_children if pending_only else self.enqueued_children for completed_child_result in wait_for_any_results(child_results, **kwargs): self._update_child_state(completed_child_result, self._UNBLOCKED) yield completed_child_result
[docs] def wait_for_children(self, pending_only=True, **kwargs): """Wait for all enqueued child tasks to run and complete""" child_results = self.pending_enqueued_children if pending_only else self.enqueued_children self.wait_for_specific_children(child_results=child_results, **kwargs)
    def forget_child_result(self,
                            child_result: AsyncResult,
                            do_not_forget_report_nodes: bool = True,
                            do_not_forget_enqueue_once_nodes: bool = True,
                            do_not_forget_cache_enabled_tasks_results: bool = True,
                            **kwargs):
        """Forget results of the tree rooted at the "chain-head" of child_result,
        while skipping subtrees in skip_subtree_nodes, as well as nodes in do_not_forget_nodes.

        If do_not_forget_report_nodes is True (default), do not forget report nodes
        (e.g. nodes decorated with @email)

        If do_not_forget_enqueue_once_nodes is True (default), do not forget subtrees rooted at
        nodes that were enqueued with enqueue_once

        If do_not_forget_cache_enabled_tasks_results is True (default), do not forget subtrees rooted at
        nodes that belong to services with cached=True
        """
        logger.debug('Forgetting results')

        # Collect uids of subtrees that must survive the forget.
        skip_subtree_nodes: set[str] = set()
        if do_not_forget_enqueue_once_nodes:
            enqueue_once_subtree_nodes = get_current_enqueue_child_once_uids(self.backend)
            if enqueue_once_subtree_nodes:
                skip_subtree_nodes.update(enqueue_once_subtree_nodes)
                logger.debug(f'Enqueue once subtree nodes: {enqueue_once_subtree_nodes}')

        if do_not_forget_cache_enabled_tasks_results:
            cache_enabled_subtree_nodes = get_current_cache_enabled_uids(self.backend)
            if cache_enabled_subtree_nodes:
                skip_subtree_nodes.update(cache_enabled_subtree_nodes)
                logger.debug(f'Cache-enabled subtree nodes: {cache_enabled_subtree_nodes}')

        # Report nodes are preserved individually (not as whole subtrees).
        report_nodes = None
        if do_not_forget_report_nodes:
            report_nodes = get_current_reports_uids(self.backend)
            if report_nodes:
                logger.debug(f'Report nodes: {report_nodes}')

        forget_chain_results(child_result,
                             skip_subtree_nodes=skip_subtree_nodes,
                             do_not_forget_nodes=report_nodes,
                             **kwargs)

        # Since we forget the child, we need to also remove it from the list of enqueued_children
        self._remove_enqueued_child(child_result)
[docs] def forget_specific_children_results(self, child_results: list[AsyncResult], **kwargs): """Forget results for the explicitly provided child_results""" for child in child_results: self.forget_child_result(child, **kwargs)
[docs] def forget_enqueued_children_results(self, **kwargs): """Forget results for the enqueued children of current task""" self.forget_specific_children_results(self.enqueued_children, **kwargs)
[docs] def wait_for_specific_children(self, child_results, forget: bool = False, **kwargs): """Wait for the explicitly provided child_results to run and complete""" if isinstance(child_results, AsyncResult): child_results = [child_results] if child_results: logger.debug('Waiting for enqueued children: %r' % get_tasks_names_from_results(child_results)) try: wait_on_async_results_and_maybe_raise(child_results, caller_task=self, **kwargs) finally: [self._update_child_state(child_result, self._UNBLOCKED) for child_result in child_results] if forget: self.forget_specific_children_results(child_results)
    def enqueue_child(
        self,
        chain: SignatureX,
        add_to_enqueued_children: bool=True,
        block: bool=False,
        raise_exception_on_failure: Optional[bool]=None,
        apply_async_epilogue: Optional[Callable[[AsyncResult], None]]=None,
        forget: bool=False,
        **kwargs,
    ) -> Optional[AsyncResult]:
        """Schedule a child task to run.

        Args:
            chain: signature/chain to enqueue; an InjectArgs-only chain is a no-op.
            add_to_enqueued_children: track the child in this task's enqueued-children state.
            block: wait for the child to complete before returning.
            raise_exception_on_failure: only valid with block=True; forwarded to the wait.
            apply_async_epilogue: callback invoked with the child's AsyncResult right after scheduling.
            forget: with block=True, forget the child's results after the wait finishes.
            **kwargs: forwarded to wait_on_async_results_and_maybe_raise when blocking.

        Returns:
            The child's AsyncResult, or None when ``chain`` is an InjectArgs.

        Raises:
            ValueError: raise_exception_on_failure given without block=True.
        """
        if raise_exception_on_failure is not None:
            if not block:
                raise ValueError('Cannot control exceptions on child failure if we don\'t block')
            # Only set it if not None, otherwise we want to leave the downstream default
            kwargs['raise_exception_on_failure'] = raise_exception_on_failure

        if isinstance(chain, InjectArgs):
            return  # FIXME: need to always return an AsyncResult

        child_result = chain.apply_async_x(self.context.bog.get_auto_inject_registry())
        if apply_async_epilogue:
            apply_async_epilogue(child_result)
        if add_to_enqueued_children:
            self._update_child_state(child_result, self._PENDING)
        if block:
            try:
                wait_on_async_results_and_maybe_raise(
                    results=child_result,
                    caller_task=self,
                    **kwargs)
            finally:
                # Child is no longer blocking us, even if the wait raised.
                if add_to_enqueued_children:
                    self._update_child_state(child_result, self._UNBLOCKED)
            if forget:
                self.forget_specific_children_results([child_result])
        return child_result
[docs] def enqueue_child_and_get_results(self, *args, return_keys: Union[str, tuple] = (), return_keys_only: bool = True, merge_children_results: bool = False, extract_from_parents: bool = True, **kwargs) -> dict: """Apply a ``chain``, and extract results from it. This is a better version of `enqueue_child_and_extract` where the defaults for `extract_from_children` and `extract_task_returns_only` defaults are more intuitive. Additionally, extract_from_parents defaults to True in this API. Note: This is shorthand for :meth:`enqueue_child` followed with :meth:`get_results`. Args: *args: Tuple of args required by :meth:`enqueue_child` return_keys: A single return key string, or a tuple of keys to extract from the task results. The default value of :const:`None` will return a dictionary of key/value pairs for the returned results. return_keys_only: If set, only return results for keys specified by the tasks' `@returns` decorator or :attr:`returns` attribute, otherwise, returns will include key/value pairs from the BoG. merge_children_results: If set, extract and merge results from the children tasks as well. extract_from_parents: If set, will consider all results returned from tasks of the given chain (parents of the last task). Else will consider only results returned by the last task of the chain. **kwargs: Other options to :meth:`enqueue_child` Returns: The returns of `get_results`. See Also: get_results """ return self.enqueue_child_and_extract(*args, return_keys=return_keys, extract_from_children=merge_children_results, extract_task_returns_only=return_keys_only, extract_from_parents=extract_from_parents, **kwargs)
[docs] def enqueue_child_and_extract(self, *args, **kwargs) -> Union[tuple, dict]: """Apply a ``chain``, and extract results from it. See: _enqueue_child_and_extract """ if kwargs.pop('enqueue_once_key', None): raise ValueError('Invalid argument. Use the enqueue_child_once_and_extract() api.') return self._enqueue_child_and_extract(*args, **kwargs)
def _enqueue_child_and_extract(self, *args, return_keys: Union[str, tuple] = (), extract_from_children: bool = True, extract_task_returns_only: bool = False, enqueue_once_key: str = '', extract_from_parents: bool = True, forget: bool = False, **kwargs) -> Union[tuple, dict]: """Apply a ``chain``, and extract results from it. Note: This is shorthand for :meth:`enqueue_child` followed with :meth:`extract_and_filter`. Args: *args: Tuple of args required by :meth:`enqueue_child` return_keys: A single return key string, or a tuple of keys to extract from the task results. The default value of :const:`None` will return a dictionary of key/value pairs for the returned results. extract_from_children: If set, extract and merge results from the children tasks as well. extract_task_returns_only: If set, only return results for keys specified by the tasks' `@returns` decorator or :attr:`returns` attribute, otherwise, returns will include key/value pairs from the BoG. enqueue_once_key: a string key, which, if set will be used to check if this task needs to be run, Use the enqueue_child_once_and_extract wrapper to set this. Should be unique per FireX run. extract_from_parents: If set, will consider all results returned from tasks of the given chain (parents of the last task). Else will consider only results returned by the last task of the chain. NOTE: Will not work on reconstituted AsyncResult objects, such as those sometimes created by the enqueue_once API. **kwargs: Other options to :meth:`enqueue_child` Returns: The returns of `extract_and_filter`. 
See Also: extract_and_filter """ # Remove block from kwargs if it exists _block = kwargs.pop('block', True) if not _block: logger.warning(f'enqueue_child_and_extract ignored block={_block}, ' 'since it needs to block in order to extract results') if not enqueue_once_key: result_promise = self.enqueue_child(*args, block=True, **kwargs) else: # Need to make sure task with this key is run only once result_promise = self.enqueue_child_once(*args, enqueue_once_key=enqueue_once_key, block=True, **kwargs) results = get_results(result_promise, return_keys=return_keys, merge_children_results=extract_from_children, return_keys_only=extract_task_returns_only, extract_from_parents=extract_from_parents) if forget: self.forget_specific_children_results([result_promise]) return results
    def enqueue_child_once(self, *args, enqueue_once_key, block=False, **kwargs) -> AsyncResult:
        """Enqueue a child at most once per run for ``enqueue_once_key``.

        The first caller (decided by an atomic backend counter) actually enqueues
        the child and publishes its task-id; other callers poll the backend for
        that task-id and get an AsyncResult for the already-enqueued task.

        See :`meth:`enqueue_child_once_and_extract`

        Raises:
            WaitOnChainTimeoutError: the owning caller never published a task-id.
        """
        if self.request.retries > 0:
            # NOTE: We presume previous run of the enqueue service failed and needs to rerun, so we use a new key.
            # There is danger here: If we are retrying before originally enqueueing this service, it's possible that
            # a regular enqueue of this service from elsewhere is still running and the new enqueue with the new
            # key will clash with that one
            enqueue_once_key = f'{enqueue_once_key}_{self.request.retries}'
            logger.info(f'Enqueue once: set new enqueue key, since this is a retry ({enqueue_once_key})')

        enqueue_child_once_uid_dbkey = get_enqueue_child_once_uid_dbkey(enqueue_once_key)
        enqueue_child_once_count_dbkey = get_enqueue_child_once_count_dbkey(enqueue_once_key)
        # Atomic increment elects the single "owner" that actually enqueues the child.
        num_runs_attempted = self.backend.client.incr(enqueue_child_once_count_dbkey)
        if int(num_runs_attempted) == 1:
            # This is the first attempt, enqueue the child
            apply_async_epilogue = partial(_set_taskid_in_db_key, db=self.backend, db_key=enqueue_child_once_uid_dbkey)
            return self.enqueue_child(*args, block=block, apply_async_epilogue=apply_async_epilogue, **kwargs)

        # Someone else is running this; wait for uuid to be set in the backend
        logger.info(f'Skipping enqueue of task with enqueue-once key {enqueue_once_key}; '
                    f'It\'s being enqueued by a different owner.')

        # Wait for task-id to show up in the backend
        sec_to_wait = 60
        logger.info(f'Checking for task-id; might take up to {sec_to_wait} seconds.')
        loop_start_time = current_time = time.time()
        while (current_time - loop_start_time) < sec_to_wait:
            uid_of_enqueued_task = self.backend.get(enqueue_child_once_uid_dbkey)
            if uid_of_enqueued_task:
                break  # <-- we are done!
            time.sleep(0.1)
            current_time = time.time()
        else:
            # This is unexpected, since we expect uuid to be set by whoever is enqueueing this
            raise WaitOnChainTimeoutError(f'Timed out waiting for task-id to be set.'
                                          f' (enqueue-once key: {enqueue_once_key})')

        task_uid = uid_of_enqueued_task.decode()
        logger.info(f'{enqueue_once_key} is enqueued with task-id: {task_uid}')
        self._send_flame_additional_child(task_uid)
        # Reconstituted result: the task was enqueued by a different owner.
        result = AsyncResult(task_uid)
        if block:
            logger.debug(f'Waiting for results of non-child task {get_result_logging_name(result)}')
            wait_on_async_results_and_maybe_raise(results=result, caller_task=self, **kwargs)
        return result
[docs] def enqueue_child_once_and_extract(self, *args, enqueue_once_key: str, **kwargs): """Apply a ``chain`` with a unique key only once per FireX run, and extract results from it. Note: This is like :meth:`enqueue_child_and_extract`, but it sets `enqueue_once_key`. """ if kwargs.pop('extract_from_parents', False): raise ValueError('Unable to extract returns from parents when using enqueue_child_once.') return self._enqueue_child_and_extract(*args, enqueue_once_key=enqueue_once_key, extract_from_parents=False, **kwargs)
    def enqueue_in_parallel(self, chains, max_parallel_chains=15, wait_for_completion=True,
                            raise_exception_on_failure=False, **kwargs):
        """ This method executes the provided list of Signatures/Chains in parallel and returns the
            associated list of "async_result" objects.
            The results are returned in the same order as the input Signatures/Chains.

        Args:
            chains: iterable of Signatures/Chains to schedule.
            max_parallel_chains: maximum number of chains in flight at once.
            wait_for_completion: block until all scheduled chains complete.
            raise_exception_on_failure: forwarded to the waits; also forces a final wait.
            **kwargs: forwarded to :meth:`enqueue_child` for each chain.
        """
        promises = []
        scheduled = []
        for c in chains:
            if len(scheduled) >= max_parallel_chains:
                # Reach the max allowed parallel chains, wait for one to complete before scheduling the next one.
                async_res = next(wait_for_any_results(scheduled, raise_exception_on_failure=raise_exception_on_failure))
                scheduled.remove(async_res)

            # Schedule the next child
            logger.debug(f'Enqueueing: {c.get_label()}')
            promise = self.enqueue_child(c, **kwargs)
            scheduled.append(promise)
            promises.append(promise)

        if wait_for_completion or raise_exception_on_failure:
            # Wait for all children to complete
            self.wait_for_specific_children(promises, raise_exception_on_failure=raise_exception_on_failure)

        return promises
[docs] def enqueue_child_from_spec(self, task_spec: TaskEnqueueSpec, inject_args: Optional[dict] = None): enqueue_opts = task_spec.enqueue_opts or dict() chain = task_spec.signature args_to_inject = self.abog.copy() if task_spec.inject_abog else {} if inject_args: args_to_inject.update(inject_args) if args_to_inject: from firexkit.chain import InjectArgs chain = InjectArgs(**args_to_inject) | chain logger.debug(f'Enqueuing {task_spec}') self.enqueue_child(chain, **enqueue_opts)
[docs] def revoke_nonready_children(self): nonready_children = self.nonready_enqueued_children if nonready_children: logger.info('Nonready children of current task exist.') revoked = [self.revoke_child(child_result) for child_result in nonready_children] wait_for_running_tasks_from_results([result for result_list in revoked for result in result_list])
    def revoke_child(self, result: AsyncResult, terminate=True, wait=False, timeout=None):
        """Revoke ``result`` and every not-yet-ready parent in its chain.

        Returns:
            The list of AsyncResults that were revoked (the child first, then parents).
        """
        name = get_result_logging_name(result)
        logger.debug('Revoking child %s' % name)
        result.revoke(terminate=terminate, wait=wait, timeout=timeout)
        revoked_results = [result]
        self._update_child_state(result, self._UNBLOCKED)
        logger.info(f'Revoked {name}')
        while result.parent:
            # Walk up the chain, since nobody is waiting on those tasks explicitly.
            result = result.parent
            if not result.ready():
                name = get_result_logging_name(result)
                logger.debug(f'Revoking parent {name}')
                result.revoke(terminate=terminate, wait=wait, timeout=timeout)
                revoked_results.append(result)
                logger.info(f'Revoked {name}')
        return revoked_results
    @property
    def root_logger_file_handler(self):
        """The root logger's WatchedFileHandler (the worker's log file handler)."""
        # NOTE(review): raises IndexError if the root logger has no WatchedFileHandler.
        return [handler for handler in logger.root.handlers if isinstance(handler, WatchedFileHandler)][0]

    @property
    def worker_log_file(self):
        """Path of the file the root logger's WatchedFileHandler writes to."""
        return self.root_logger_file_handler.baseFilename

    @property
    def file_logging_dirpath(self):
        """Directory containing the worker log file (cached after first access)."""
        if self._file_logging_dir_path:
            return self._file_logging_dir_path
        else:
            self._file_logging_dir_path = os.path.dirname(self.worker_log_file)
            return self._file_logging_dir_path

    @property
    def logs_dir_for_worker(self):
        """Parent of the file-logging directory (cached after first access)."""
        if self._logs_dir_for_worker:
            return self._logs_dir_for_worker
        else:
            self._logs_dir_for_worker = os.path.dirname(self.file_logging_dirpath)
            return self._logs_dir_for_worker
[docs] def get_task_logging_dirpath_from_request(self, request): # Sometimes self.request isn't populated correctly, so we need to use this version instead of the property if self._task_logging_dirpath: return self._task_logging_dirpath else: _task_logging_dirpath = os.path.join(self.file_logging_dirpath, request.hostname) if not os.path.exists(_task_logging_dirpath): os.makedirs(_task_logging_dirpath, exist_ok=True) self._task_logging_dirpath = _task_logging_dirpath return self._task_logging_dirpath
    @property
    def task_logging_dirpath(self):
        """Per-worker directory holding this task's logfile (see the request-based variant)."""
        return self.get_task_logging_dirpath_from_request(request=self.request)

    @property
    def task_log_url(self):
        """URL for this task's logfile when a viewer is installed, else the plain path."""
        if self.app.conf.install_config.has_viewer():
            # FIXME: there must be a more direct way of getting this relative path.
            log_entry_rel_run_root = os.path.relpath(self.task_logfile, self.app.conf.logs_dir)
            return self.app.conf.install_config.get_log_entry_url(log_entry_rel_run_root)
        else:
            return self.task_logfile
[docs] def get_task_logfile_from_request(self, request): # Sometimes self.request isn't populated correctly, so we need to use this version instead of the property return self.get_task_logfile(self.get_task_logging_dirpath_from_request(request=request), self.name, request.id)
    @property
    def task_logfile(self) -> str:
        """Path to this task's per-task html logfile (derived from self.request)."""
        return self.get_task_logfile_from_request(request=self.request)
[docs] @classmethod def get_task_logfile(cls, task_logging_dirpath, task_name, uuid): return os.path.join(task_logging_dirpath, cls.get_task_logfilename(task_name, uuid))
[docs] @staticmethod def get_task_logfilename(task_name, uuid): return '{}_{}.html'.format(task_name, str(uuid))
    @property
    def worker_log_url(self):
        """Worker log file path, with a '#<task_label>' fragment appended when a
        task label is available."""
        worker_log_url = self.worker_log_file
        task_label = self.task_label
        if task_label:
            # urljoin with a bare fragment keeps the path and appends '#<label>'.
            worker_log_url = urljoin(worker_log_url, f'#{task_label}')
        return worker_log_url
    def write_task_log_html_header(self):
        """Render the html log header (stylesheet, logo, titles, worker links) into
        this task's logfile, overwriting any existing content."""
        base_dir = self.task_logging_dirpath
        worker_name = self.request.hostname
        # Hostname is '<worker>@<host>'; keep the host part after the first '@'.
        worker_hostname = worker_name.split('@', 1)[-1]
        html_header = JINJA_ENV.get_template('log_template.html').render(
            firex_stylesheet=get_firex_css_filepath(self.app.conf.resources_dir, relative_from=base_dir),
            logo=get_firex_logo_filepath(self.app.conf.resources_dir, relative_from=base_dir),
            firex_id=self.app.conf.uid,
            link_for_logo=self.app.conf.link_for_logo,
            header_main_title=self.name_without_orig,
            worker_log_url=os.path.relpath(self.worker_log_url, base_dir),
            worker_name=worker_name,
            worker_hostname=worker_hostname,
        )
        with open(self.task_logfile, 'w') as f:
            f.write(html_header)
    def add_task_logfile_handler(self):
        """Attach file handlers so root and 'celery.task' log records are mirrored
        into this task's per-task html logfile (tracked for later removal)."""
        task_logfile = self.task_logfile
        if not os.path.isfile(task_logfile):
            self.write_task_log_html_header()
        self._temp_loghandlers = {}
        fh_root = WatchedFileHandler(task_logfile, mode='a+')
        # Reuse the worker log's formatter so records look consistent.
        fh_root.setFormatter(self.root_logger_file_handler.formatter)
        logger.root.addHandler(fh_root)
        self._temp_loghandlers[logger.root] = fh_root

        task_logger = get_logger('celery.task')
        fh_task = logging.FileHandler(task_logfile, mode='a+')
        # NOTE(review): assumes 'celery.task' already has a WatchedFileHandler;
        # the [0] lookup raises IndexError otherwise.
        original_file_handler = [handler for handler in task_logger.handlers
                                 if isinstance(handler, WatchedFileHandler)][0]
        fh_task.setFormatter(original_file_handler.formatter)
        task_logger.addHandler(fh_task)
        self._temp_loghandlers[task_logger] = fh_task
[docs] def remove_task_logfile_handler(self): if self._temp_loghandlers: for _logger, _handler in self._temp_loghandlers.items(): _logger.removeHandler(_handler)
[docs] def send_event(self, *args, **kwargs): if not self.request.called_directly: super(FireXTask, self).send_event(*args, **kwargs)
    def duration(self):
        """Seconds elapsed since this task's recorded start time, or None when unavailable."""
        return get_time_from_task_start(self.request.id, self.backend)
    def start_time(self) -> Optional[float]:
        """This task's recorded start timestamp (epoch seconds), or None when unavailable."""
        return get_task_start_time(self.request.id, self.backend)
    def _get_task_flame_configs(self) -> dict:
        """Merge flame configs registered by decorators with any ``flame`` attribute
        on the task; per-key, the task attribute takes precedence."""
        decorator_flame_configs = deepcopy(getattr(self.undecorated, "flame_data_configs", {}))

        flame_value = get_attr_unwrapped(self, 'flame', None)
        task_flame_config = OrderedDict()
        if flame_value:
            if isinstance(flame_value, str):
                # Config is only a key name, fill in default config.
                task_flame_config = OrderedDict([(flame_value, create_flame_config([]))])
            elif isinstance(flame_value, list):
                # Config is a list of key names, each of which should get a default config.
                # Create list of default configs so that their order is set properly.
                default_flame_configs = []
                for _ in flame_value:
                    default_flame_configs.append(create_flame_config(default_flame_configs))

                # associated ordered default configs with key names from flame decorator.
                task_flame_config = OrderedDict([(key_name, default_flame_configs[i])
                                                 for i, key_name in enumerate(flame_value)])
            elif isinstance(flame_value, dict):
                task_flame_config = OrderedDict(flame_value)

        return decorator_flame_configs | task_flame_config
[docs] def send_flame(self, data: Mapping[str, Any]): if self.request.called_directly: return if getattr(self.context, 'flame_configs', False): def safe_format(formatter, fromatter_args, formatter_kwargs): try: return formatter(*fromatter_args, **formatter_kwargs) except Exception as e: logger.exception(e) return None formatted_data = {} for flame_key, flame_config in self.context.flame_configs.items(): # Data can be sent either because it is supplied in the input or if data was registered to be sent # 'on_next' during flame_data_config registration. if flame_key in data \ or flame_config['on_next'] \ or (flame_key is None or flame_key == '*'): formatter_kwargs = {'task': self} if flame_config['bind'] else {} if flame_key in data: formatter_args = [data[flame_key]] elif flame_config['on_next']: formatter_args = flame_config['on_next_args'] elif flame_key is None or flame_key == '*': # None means execute formatter with all data. formatter_args = [data] else: formatter_args = [] format_result = safe_format(flame_config['formatter'], formatter_args, formatter_kwargs) if format_result is not None: formatted_data[flame_key] = { 'value': format_result, 'type': flame_config['data_type'], 'order': flame_config['order'], } if formatted_data: self.send_firex_event_raw({'flame_data': formatted_data}) sent_on_next_keys = [k for k, v in self.context.flame_configs.items() if v['on_next'] and k in formatted_data] for k in sent_on_next_keys: self.context.flame_configs[k]['on_next'] = False
    def send_firex_event_raw(self, data):
        """Emit a raw 'task-send-flame' celery event carrying ``data`` as event fields."""
        self.send_event('task-send-flame', **data)
[docs] def send_firex_html(self, **kwargs): formatted_data = {flame_key: {'value': html_data, 'type': 'html', 'order': time.time()} for flame_key, html_data in kwargs.items()} self.send_firex_event_raw({'flame_data': formatted_data})
    def send_display_collapse(self, task_uuid: Optional[str]=None):
        """
        Collapse the current task (default), or collapse the task with the supplied UUID.
        """
        if task_uuid is None:
            task_uuid = self.request.id
        # Build a collapse operation targeting the given task and emit it as flame data.
        formatted_data = {
            FLAME_COLLAPSE_KEY: {
                'value': flame_collapse_formatter([{
                    'targets': ['self'],
                    'relative_to_nodes': {'type': 'task_uuid', 'value': task_uuid},
                }], self),
                'type': 'object',
                'order': time.time()}
        }
        self.send_firex_event_raw({'flame_data': formatted_data})
    def init_auto_inject_registry(self, auto_inject_args: list[AutoInjectSpec]):
        """
        Expected to only be called once per run, by the root task. The registry created
        there then propagates to all tasks via the BoG.
        """
        # auto inject pause args, if any.
        pauses = PauseTasks.create_from_abog(self.abog)
        if pauses.pause_tasks_by_name:
            # Append (without mutating the caller's list) a spec so PauseTasks
            # itself is auto-injectable under its abog key.
            auto_inject_args = auto_inject_args + [
                AutoInjectSpec(PauseTasks, PauseTasks.PAUSE_TASKS_ABOG_KEY, pauses)
            ]

        self.context.bog.init_auto_inject_registry(auto_inject_args)
[docs] def has_dynamic_returns(self) -> bool: # If any of the previous keys has a dynamic return, then we can't do any validation return any(FireXTask.is_dynamic_return(k) for k in self.return_keys)
def undecorate_func(func):
    """Follow the ``__wrapped__`` chain to the innermost (undecorated) function."""
    current = func
    while hasattr(current, '__wrapped__'):
        current = current.__wrapped__
    return current
def undecorate(task):
    """:return: the original function that was used to create a microservice"""
    raw = undecorate_func(task.run)
    # Rebind as a method only when the original run was a bound method and the
    # unwrapped function is not already one.
    if not inspect.ismethod(task.run) or inspect.ismethod(raw):
        return raw
    return MethodType(raw, task)
def get_attr_unwrapped(fun: Callable, attr_name, *default_value):
    """Search ``fun`` and its ``__wrapped__`` chain for ``attr_name``.

    Returns the first value found; otherwise the optional default, or raises
    AttributeError when no default was supplied.
    """
    current = fun
    while current:
        if hasattr(current, attr_name):
            return getattr(current, attr_name)
        current = getattr(current, '__wrapped__', None)
    if default_value:
        return default_value[0]
    raise AttributeError(attr_name)
def is_jsonable(obj) -> bool:
    """Returns :const:`True` if the `obj` can be serialized via Json,
    otherwise returns :const:`False`
    """
    try:
        json.dumps(obj)
    except (TypeError, ValueError, OverflowError):
        # TypeError: unserializable type.
        # ValueError: e.g. circular references (previously leaked out of this
        # predicate instead of returning False).
        # OverflowError: values out of range for the serializer.
        return False
    return True
def _custom_serializers(obj) -> Optional[str]:
    """Last-resort serializer for otherwise non-jsonable objects.

    Currently only handles failed AsyncResults, rendered as
    '<ShortTaskName> failed: <failure>'. Returns None when no custom
    serialization applies.
    """
    # This is primarily done to make root service "unsuccessful_services" visible in run.json
    if isinstance(obj, AsyncResult) and obj.failed():
        task_name = get_task_name_from_result(obj)
        if task_name:
            if isinstance(obj.result, Exception):
                # Surface the underlying cause rather than a ChainInterrupted wrapper.
                failure = first_non_chain_interrupted_exception(obj.result)
            else:
                failure = obj.result
            return f'{task_name.split(".")[-1]} failed: {failure}'
    return None
def convert_to_serializable(obj, max_recursive_depth=10, _depth=0):
    """Best-effort conversion of ``obj`` into something json-serializable.

    Primitives pass through; known types (datetime, Enum classes, pydantic
    models, dataclasses) are converted; dicts and iterables are walked
    recursively up to ``max_recursive_depth``; anything else falls back to a
    custom serializer or ``repr``.
    """
    if obj is None or isinstance(obj, (int, float, str, bool)):
        return obj

    # Objects (not classes) may opt in to their own serialization protocol.
    if hasattr(obj, 'firex_serializable') and not isinstance(obj, type):
        return obj.firex_serializable()

    if isinstance(obj, datetime):
        obj = obj.isoformat()

    # An Enum *class* (not member) serializes as its name.
    if isinstance(obj, type) and issubclass(obj, enum.Enum):
        return obj.__name__

    if isinstance(obj, pydantic.BaseModel):
        return obj.model_dump(mode='json')
    elif dataclasses.is_dataclass(obj):
        try:
            obj = dataclasses.asdict(obj)
        except TypeError:
            pass # e.g. enums

    if is_jsonable(obj):
        return obj

    # recursive reference guard.
    if _depth < max_recursive_depth:
        # Full object isn't jsonable, but some contents might be. Try walking the structure to get jsonable parts.
        if isinstance(obj, dict):
            jsonable_dict = {}
            for k, v in obj.items():
                serializable_key = convert_to_serializable(k, max_recursive_depth, _depth+1)
                if isinstance(serializable_key, list):
                    # dict keys can't be lists; collapse the key to a json string.
                    serializable_key = json.dumps(serializable_key)
                jsonable_dict[serializable_key] = convert_to_serializable(v, max_recursive_depth, _depth+1)
            return jsonable_dict

        # Note that it's important this DOES NOT catch strings, and it won't since strings are jsonable.
        if isinstance(obj, Iterable):
            return [convert_to_serializable(e, max_recursive_depth, _depth+1) for e in obj]

    # Either input isn't walkable (i.e. dict or iterable), or we're too deep in the structure to keep walking.
    custom_serialized = _custom_serializers(obj)
    if custom_serialized is not None:
        return custom_serialized
    return repr(obj)
def get_starttime_dbkey(task_id):
    """Backend db key under which a task's start timestamp is stored."""
    return f'{task_id}_starttime'
@celery.signals.task_prerun.connect
def statsd_task_prerun(sender, task, **donotcare):
    """Celery task_prerun signal hook: record the task's start time in the backend."""
    _set_task_start_time(task)
def get_task_start_time(task_id, backend) -> Optional[float]:
    """Fetch the recorded start time (epoch seconds) for ``task_id`` from the backend.

    Returns None when no start time was recorded or the lookup/conversion fails
    (deliberately best-effort: any backend error is swallowed).
    """
    key = get_starttime_dbkey(task_id)
    try:
        raw = backend.get(key)
        return float(raw)
    except Exception:
        return None
def get_time_from_task_start(task_id, backend):
    """Seconds elapsed since ``task_id``'s recorded start, or None when unknown."""
    start = get_task_start_time(task_id, backend)
    if not start:
        return None
    return time.time() - start
def _set_task_start_time(task: FireXTask, force=False): starttime_dbkey = get_starttime_dbkey(task.request.id) if not task.backend.get(starttime_dbkey): task.backend.set(starttime_dbkey, time.time()) class _PausePoints(str, enum.Enum): PAUSE_BEFORE = 'PAUSE_BEFORE' PAUSE_AFTER = 'PAUSE_AFTER' PAUSE_ON_FAILURE = 'PAUSE_ON_FAILURE' @dataclasses.dataclass class _TaskPauseRequest: task_name: str pause_point: _PausePoints pause_hours: float def _listy(val: Any) -> list[str]: if isinstance(val, str): l = [e.strip() for e in val.split(',') if e.strip()] elif isinstance(val, list): l = [str(e) for e in val] else: l = [str(val)] return l DEFAULT_PAUSE = 4
@dataclasses.dataclass
class PauseTasks:
    """All pause requests for a FireX run, keyed by task short-name."""

    # task short-name -> list of pause requests for that task
    pause_tasks_by_name: dict[str, list[_TaskPauseRequest]]
    # whether the Pause service should send an email notification
    send_pause_email_notification: bool

    # abog key under which the PauseTasks instance is auto-injected
    PAUSE_TASKS_ABOG_KEY: typing.ClassVar[str] = 'pause_tasks_reqs'

    @staticmethod
    def get_cli_opts() -> list[dict]:
        """CLI/abog option spec: each entry ties a task-list abog key and its
        companion hours abog key to a pause point."""
        return [
            dict(
                task_abog_key='pause_on',
                pause_point=_PausePoints.PAUSE_BEFORE,
                hours_abog_key='pause_on_hours',
            ),
            dict(
                task_abog_key='pause_before',
                pause_point=_PausePoints.PAUSE_BEFORE,
                hours_abog_key='pause_before_hours',
            ),
            dict(
                task_abog_key='pause_after',
                pause_point=_PausePoints.PAUSE_AFTER,
                hours_abog_key='pause_after_hours',
            ),
            dict(
                task_abog_key='pause_on_failure',
                pause_point=_PausePoints.PAUSE_ON_FAILURE,
                hours_abog_key='pause_on_failure_hours',
            ),
        ]

    @staticmethod
    def get_pause_arg_names() -> list[str]:
        """All abog argument names consumed by the pause feature."""
        args = []
        for o in PauseTasks.get_cli_opts():
            args.append(o['task_abog_key'])
            args.append(o['hours_abog_key'])
        return args

    @staticmethod
    def create_from_abog(abog: typing.Mapping[str, typing.Any]) -> 'PauseTasks':
        """Build a PauseTasks from abog values, one _TaskPauseRequest per
        (task name, pause point) pair found."""
        pause_tasks_by_name: dict[str, list[_TaskPauseRequest]] = {}
        for pause_point_opt in PauseTasks.get_cli_opts():
            if (pause_task_val := abog.get(pause_point_opt['task_abog_key'])):
                task_names: list[str] = _listy(pause_task_val)
                # Duration precedence: per-point hours, then generic
                # 'pause_duration', then the default.
                pause_duration = float(
                    abog.get(pause_point_opt['hours_abog_key'])
                    or abog.get('pause_duration')
                    or DEFAULT_PAUSE
                )
                for task_name in task_names:
                    if task_name not in pause_tasks_by_name:
                        pause_tasks_by_name[task_name] = []
                    pause_tasks_by_name[task_name].append(
                        _TaskPauseRequest(
                            task_name,
                            pause_point_opt['pause_point'],
                            pause_duration,
                        )
                    )
        if pause_tasks_by_name:
            logger.debug(f'Found pause requests: {pause_tasks_by_name}')
        return PauseTasks(
            pause_tasks_by_name=pause_tasks_by_name,
            send_pause_email_notification=bool(abog.get('send_pause_email_notification', True))
        )

    def pause_point_requested(self, task_name: str, point: _PausePoints) -> typing.Optional[_TaskPauseRequest]:
        """Return the first pause request for ``task_name`` at ``point``, or None."""
        if (
            pause_specs := self.pause_tasks_by_name.get(task_name)
        ):
            return next(
                (ps for ps in pause_specs if ps.pause_point == point),
                None)
        return None