# Source code for weaver.datatype

"""
Definitions of types used by tokens.
"""

import abc
import base64
import copy
import enum
import inspect
import io
import json
import os
import re
import shutil
import tempfile
import traceback
import uuid
import warnings
from datetime import datetime, timedelta
from decimal import ConversionSyntax, Decimal
from io import BytesIO
from logging import ERROR, INFO, getLevelName, getLogger
from secrets import compare_digest, token_hex
from typing import TYPE_CHECKING, cast
from urllib.parse import urljoin, urlparse

import colander
import pyramid.httpexceptions
import requests.exceptions
from cryptography.fernet import Fernet
from cwlprov.tool import Tool as CWLProvTool
from dateutil.parser import parse as dt_parse
from docker.auth import decode_auth  # pylint: disable=E0611
from owslib.util import ServiceException as OWSServiceException
from owslib.wps import Process as ProcessOWS, WPSException
from pywps import Process as ProcessWPS
from pywps.app import WPSRequest
from pywps.response.describe import DescribeResponse
from werkzeug.wrappers import Request as WerkzeugRequest

from weaver import xml_util
from weaver.exceptions import ProcessInstanceError, ServiceParsingError
from weaver.execute import (
    ExecuteControlOption,
    ExecuteMode,
    ExecuteResponse,
    ExecuteReturnPreference,
    ExecuteTransmissionMode
)
from weaver.formats import AcceptLanguage, ContentType, OutputFormat, repr_json
from weaver.processes.constants import (
    CWL_NAMESPACE_WEAVER_ID,
    CWL_REQUIREMENT_APP_DOCKER,
    CWL_REQUIREMENT_APP_DOCKER_GPU,
    CWL_REQUIREMENT_APP_OGC_API,
    CWL_REQUIREMENT_APP_WPS1,
    JobProcessingEntityType,
    JobStatusType,
    ProcessSchema
)
from weaver.processes.convert import get_field, json2oas_io, normalize_ordered_io, null, ows2json, wps2json_io
from weaver.processes.types import ProcessType
from weaver.provenance import ProvenanceFormat
from weaver.quotation.status import QuoteStatus
from weaver.status import JOB_STATUS_CATEGORIES, Status, StatusCategory, map_status
from weaver.store.base import StoreProcesses
from weaver.transform.const import EXCLUDED_TYPES
from weaver.transform.utils import extend_alternate_formats
from weaver.utils import localize_datetime  # for backward compatibility of previously saved jobs not time-locale-aware
from weaver.utils import (
    LoggerHandler,
    VersionFormat,
    apply_number_with_unit,
    as_version_major_minor_patch,
    extend_instance,
    fully_qualified_name,
    get_job_log_msg,
    get_log_date_fmt,
    get_log_fmt,
    get_path_kvp,
    get_settings,
    is_valid_url,
    now,
    request_extra
)
from weaver.visibility import Visibility
from weaver.warning import NonBreakingExceptionWarning, UnsupportedOperationWarning
from weaver.wps.utils import get_wps_client, get_wps_output_dir, get_wps_url
from weaver.wps_restapi import swagger_definitions as sd
from weaver.wps_restapi.utils import get_wps_restapi_base_url

if TYPE_CHECKING:
    from logging import Logger
    from typing import Any, Callable, Dict, IO, Iterator, List, Optional, Tuple, Union
    from typing_extensions import TypeAlias

    from owslib.wps import WebProcessingService

    from weaver.execute import (
        AnyExecuteControlOption,
        AnyExecuteMode,
        AnyExecuteResponse,
        AnyExecuteReturnPreference,
        AnyExecuteTransmissionMode
    )
    from weaver.formats import AnyContentType
    from weaver.processes.constants import AnyJobProcessingEntityType, ProcessSchemaType
    from weaver.processes.types import AnyProcessType
    from weaver.provenance import AnyProvenanceFormat, ProvenancePathType
    from weaver.quotation.status import AnyQuoteStatus
    from weaver.status import AnyStatusType, StatusType
    from weaver.typedefs import (
        AnyLogLevel,
        AnyProcess,
        AnyProcessRef,
        AnyRequestType,
        AnyServiceRef,
        AnySettingsContainer,
        AnyUUID,
        AnyVersion,
        CWL,
        ExecutionInputs,
        ExecutionOutputs,
        ExecutionSubscribers,
        JobResults,
        JSON,
        Link,
        Metadata,
        Number,
        Path,
        Price,
        QuoteProcessParameters,
        QuoteProcessResults,
        QuoteStepOutputParameters,
        Statistics
    )
    from weaver.visibility import AnyVisibility

    # pylint: disable=C0103  # false-positive invalid name for typing

    AnyParams = Dict[str, Any]

    AuthenticationType: TypeAlias = "Authentication"
    DockerAuthenticationType: TypeAlias = "DockerAuthentication"
    AnyAuthentication = Union[AuthenticationType, DockerAuthenticationType]


LOGGER = getLogger(__name__)




class DictBase(dict):
    """
    Dictionary with extended attributes auto-``getter``/``setter`` for convenience.

    Explicitly overridden ``getter``/``setter`` attributes are called instead of ``dict``-key ``get``/``set``-item
    to ensure corresponding checks and/or value adjustments are executed before applying it to the sub-``dict``.
    """

    def __setattr__(self, item, value):
        """
        Uses an existing property setter if defined in the subclass or employs the default dictionary setter otherwise.

        Names that are not declared on the class at all are stored as plain dictionary entries.
        """
        # default avoids failing the class-level lookup before the dictionary fallback can be reached
        prop = getattr(type(self), item, None)
        if isinstance(prop, property) and prop.fset is not None:
            prop.fset(self, value)  # noqa
        else:
            super(DictBase, self).__setitem__(item, value)

    def __getitem__(self, item):
        """
        Uses an existing property getter if defined in the subclass or employs the default dictionary getter otherwise.

        :raises AttributeError: if no readable property exists and the key is not stored in the dictionary.
        """
        # default avoids failing the class-level lookup before the dictionary fallback can be reached
        prop = getattr(type(self), item, None)
        if isinstance(prop, property) and prop.fget is not None:
            return prop.fget(self)  # noqa
        if item in self:
            # prefer a matching attribute when one resolves, otherwise return the stored dictionary value
            return getattr(self, item, dict.__getitem__(self, item))
        raise AttributeError(f"Can't get attribute '{item}' in '{fully_qualified_name(self)}'.")

    def __str__(self):
        # type: () -> str
        return type(self).__name__

    def __repr__(self):
        # type: () -> str
        _type = fully_qualified_name(self)
        _repr = dict.__repr__(self)
        return f"{_type} ({_repr})"

    @classmethod
    def properties(cls, fget=True, fset=True):
        # type: (bool, bool) -> Iterator[str]
        """
        Get names of properties stored in the object, optionally filtered by read-only or write-only conditions.

        :param fget: with ``fset=False``, selects properties that only define a getter.
        :param fset: with ``fget=False``, selects properties that only define a setter.
        :return:
            Iterator of public property names.
            When both flags are set, only properties defining both a getter and a setter are returned.
            When both flags are unset, nothing is returned.
        """
        return iter(
            name for name, prop in inspect.getmembers(cls)
            if not name.startswith("_") and isinstance(prop, property) and (
                (fget and fset and prop.fget is not None and prop.fset is not None) or
                (fget and not fset and prop.fget is not None and prop.fset is None) or
                (not fget and fset and prop.fget is None and prop.fset is not None)
            )
        )

    def dict(self):
        # type: () -> AnyParams
        """
        Generate a dictionary representation of the object, but with inplace resolution of attributes as applicable.
        """
        # update any entries by key with their attribute, using the stored value when no attribute resolves
        _dict = {key: getattr(self, key, val) for key, val in self.items()}
        # then, ensure any missing key gets added if a getter property exists for it
        props = {prop[0] for prop in inspect.getmembers(self) if not prop[0].startswith("_") and prop[0] not in _dict}
        for key in props:
            # instance-only members have no class-level counterpart, hence the default
            prop = getattr(type(self), key, None)
            if isinstance(prop, property) and prop.fget is not None:
                _dict[key] = prop.fget(self)  # noqa
        return _dict





class AutoBase(DictBase):
    """
    Base that automatically converts literal class members to properties also accessible by dictionary keys.

    On instantiation, every member declared by the subclass (i.e. not already provided by :class:`DictBase`)
    is copied onto the new instance, both as an attribute and as a dictionary entry, using the class-level
    value as default.

    .. code-block:: python

        class Data(AutoBase):
            field = 1
            other = None

        d = Data()
        d.other         # returns None
        d.other = 2     # other is modified
        d.other         # returns 2
        dict(d)         # returns {'field': 1, 'other': 2}
        d.field         # returns 1
        d["field"]      # also 1 !
    """
    def __new__(cls, *args, **kwargs):
        # names declared by the subclass: everything listed for 'cls' that 'DictBase' does not already expose
        extra_props = set(dir(cls)) - set(dir(DictBase))
        auto_cls = cast(
            "AutoBase",
            DictBase.__new__(cls, *args, **kwargs)
        )
        for prop in extra_props:
            # NOTE(review): both lambdas take an extra 'key' argument, which does not match the
            #   'fget(self)' / 'fset(self, value)' calling convention of 'property' - confirm intent
            prop_func = property(
                lambda self, key: dict.__getitem__(self, key),                  # type: ignore
                lambda self, key, value: dict.__setattr__(self, key, value)     # type: ignore
            )
            # read the class-level value through the new instance before anything is assigned on it
            default = getattr(auto_cls, prop, None)
            # NOTE(review): the property object is assigned on the instance (not on the class), and the
            #   same name is overwritten with 'default' by the very next statement - confirm it is needed
            setattr(auto_cls, prop, prop_func)
            AutoBase.__setattr__(auto_cls, prop, default)
        return auto_cls

    def __getitem__(self, item):
        # plain dictionary lookup, bypassing the property resolution performed by 'DictBase.__getitem__'
        return dict.__getitem__(self, item)

    def __setattr__(self, key, value):
        # set both as object and dict reference
        DictBase.__setattr__(self, key, value)
        dict.__setattr__(self, key, value)




class Base(DictBase):
    """
    Base interface for all data-types.

    Subclasses must provide :attr:`id`, :meth:`json` and :meth:`params`.
    """

    def __str__(self):
        # type: () -> str
        return f"{type(self).__name__} <{self.id}>"

    @property
    def __name__(self):
        # type: () -> str
        return fully_qualified_name(self)

    @property
    def id(self):
        """
        Identifier of the object, to be provided by the derived data-type.
        """
        raise NotImplementedError()

    @property
    def uuid(self):
        # type: () -> uuid.UUID
        """
        Alias of :attr:`id`.
        """
        return self.id

    def json(self):
        # type: () -> JSON
        """
        Obtain the JSON data representation for response body.

        .. note::
            This method implementation should validate the JSON schema against the API definition whenever
            applicable to ensure integrity between the represented data type and the expected API response.
        """
        raise NotImplementedError("Method 'json' must be defined for JSON request item representation.")

    def params(self):
        # type: () -> AnyParams
        """
        Obtain the internal data representation for storage.

        .. note::
            This method implementation should provide a JSON-serializable definition of all fields representing
            the object to store.
        """
        raise NotImplementedError("Method 'params' must be defined for storage item representation.")





class LocalizedDateTimeProperty(property):
    """
    Property that ensures date-time localization is applied on the stored/retrieved value as required.

    When no explicit ``fget``/``fset`` is provided, the value is read from and written to the owning
    dictionary-like instance under the name the property was assigned to in the class body.
    """

    def __init__(self,
                 fget=None,             # type: Optional[Callable[[Any], Optional[datetime]]]
                 fset=None,             # type: Optional[Callable[[Any, Union[datetime, str]], None]]
                 fdel=None,             # type: Optional[Callable[[Any], None]]
                 doc=None,              # type: Optional[str]
                 default_now=False,     # type: bool
                 ):                     # type: (...) -> None
        """
        Initialize the property.

        :param fget: custom getter employed instead of the default localized retrieval.
        :param fset: custom setter employed instead of the default localized storage.
        :param fdel: deleter forwarded to :class:`property`.
        :param doc: documentation forwarded to :class:`property`.
        :param default_now: whether a missing value is replaced (and stored) by the current date-time on retrieval.
        """
        self.default_now = default_now

        # fallback to the descriptor methods themselves, which allows them to detect custom accessors
        fget = fget or self.__get__
        fset = fset or self.__set__
        super(LocalizedDateTimeProperty, self).__init__(fget=fget, fset=fset, fdel=fdel, doc=doc)

    def __set_name__(self, owner, name):
        # type: (Any, str) -> None
        self.name = name  # pylint: disable=W0201

    def __get__(self, instance, *_):
        # type: (Any, Optional[Any]) -> Optional[datetime]
        if instance is None:
            # allow access to the descriptor as class attribute 'getattr(type(instance), property-name)'
            return self  # noqa
        # ensure that any 'fget' specified at property creation is employed
        if self.fget != self.__get__:  # pylint: disable=W0143
            return self.fget(instance)
        dt = instance.get(self.name, None)
        if not dt:
            if self.default_now:
                # store the generated value so that following retrievals return the same date-time
                cur_dt = now()
                self.__set__(instance, cur_dt)
                return cur_dt
            return None
        return localize_datetime(dt)

    def __set__(self, instance, value):
        # type: (Any, Union[datetime, str]) -> None
        # ensure that any 'fset' specified at property creation is employed
        if self.fset != self.__set__:  # pylint: disable=W0143
            return self.fset(instance, value)
        if isinstance(value, str):
            value = dt_parse(value)
        if not isinstance(value, datetime):
            name = fully_qualified_name(instance)
            raise TypeError(f"Type 'datetime' is required for '{name}.{self.name}'")
        instance[self.name] = localize_datetime(value)




class Service(Base):
    """
    Dictionary that contains OWS services.

    It always has ``name`` and ``url`` keys.
    """

    def __init__(self, *args, **kwargs):
        # type: (*Any, **Any) -> None
        super(Service, self).__init__(*args, **kwargs)
        if "name" not in self:
            raise TypeError("Service 'name' is required")
        if "url" not in self:
            raise TypeError("Service 'url' is required")
        # placeholder for the WPS client, populated on first call of 'wps'
        self["_wps"] = None

    @property
    def id(self):
        """
        Service identifier, which corresponds to its name.
        """
        return self.name

    @property
    def url(self):
        """
        Service URL.
        """
        return dict.__getitem__(self, "url")

    @property
    def name(self):
        """
        Service name.
        """
        return dict.__getitem__(self, "name")

    @property
    def type(self):
        """
        Service type.
        """
        return self.get("type", ProcessType.WPS_REMOTE)

    @property
    def public(self):
        """
        Flag if service has public access.
        """
        # TODO: public access can be set via auth parameter.
        return self.get("public", False)

    @property
    def auth(self):
        """
        Authentication method: public, token, cert.
        """
        return self.get("auth", "token")

    def json(self):
        # type: () -> JSON
        """
        Obtain the JSON representation of the service, which is the same as its stored parameters.
        """
        # TODO: apply swagger type deserialize schema check if returned in a response
        return self.params()

    def params(self):
        # type: () -> AnyParams
        """
        Obtain the fields of the service to store (the ``_wps`` client reference is not included).
        """
        return {
            "url": self.url,
            "name": self.name,
            "type": self.type,
            "public": self.public,
            "auth": self.auth
        }

    def wps(self, container=None, **kwargs):
        # type: (AnySettingsContainer, **Any) -> WebProcessingService
        """
        Obtain the remote WPS service definition and metadata.

        Stores the reference locally to avoid re-fetching it needlessly for future reference.

        :param container: forwarded to the WPS client retrieval.
        :param kwargs: additional parameters forwarded to the WPS client retrieval.
        :raises ServiceParsingError: if the remote service reported an error or its response could not be parsed.
        """
        try:
            _wps = self.get("_wps")
            if _wps is None:
                # client retrieval could also be cached if recently fetched and not yet invalidated
                self["_wps"] = _wps = get_wps_client(self.url, container=container, **kwargs)
            return _wps
        except (OWSServiceException, xml_util.ParseError) as exc:
            msg = f"Invalid XML returned by WPS [{self.name}] at [{self.url}] cannot be parsed."
            raise ServiceParsingError(
                json={"description": msg, "cause": str(exc), "error": exc.__class__.__name__}
            ) from exc

    def links(self, container, fetch=True, self_link=None):
        # type: (AnySettingsContainer, bool, Optional[str]) -> List[Link]
        """
        Obtains the links relevant to the service :term:`Provider`.

        :param container: object that helps retrieve instance details, namely the host URL.
        :param fetch: whether to attempt retrieving more precise details from the remote provider.
        :param self_link: name of a section that represents the current link that will be returned.
        """
        if fetch:
            wps = self.wps(container=container)
            wps_lang = wps.language
            wps_url = wps.url
        else:
            wps_url = self.url
            wps_lang = AcceptLanguage.EN_CA  # assume, cannot validate

        # keep only the path portion of the URL before appending the GetCapabilities query
        wps_url = urljoin(wps_url, urlparse(wps_url).path)
        wps_url = f"{wps_url}?service=WPS&request=GetCapabilities"
        api_url = get_wps_restapi_base_url(container)
        svc_url = f"{api_url}/providers/{self.name}"
        proc_url = f"{svc_url}/processes"
        links = [
            {
                "rel": "service-desc",
                "title": "Service description (GetCapabilities).",
                "href": wps_url,
                "hreflang": wps_lang,
                "type": ContentType.APP_XML,
            },
            {
                "rel": "service",
                "title": "Service definition.",
                "href": svc_url,
                "hreflang": AcceptLanguage.EN_CA,
                "type": ContentType.APP_JSON,
            },
            {
                "rel": self_link or "self",
                "title": "Provider definition.",
                "href": svc_url,
                "hreflang": AcceptLanguage.EN_CA,
                "type": ContentType.APP_JSON,
            },
            {
                "rel": sd.OGC_API_PROC_REL_PROCESSES_URI,
                "title": "Listing of processes provided by this service.",
                "href": proc_url,
                "hreflang": AcceptLanguage.EN_CA,
                "type": ContentType.APP_JSON,
            },
        ]
        return links

    def metadata(self, container):
        # type: (AnySettingsContainer) -> List[Metadata]
        """
        Obtains the metadata relevant to the service provider.
        """
        wps = self.wps(container=container)
        wps_lang = wps.language
        # FIXME: add more metadata retrieved from 'wps.identification' and 'wps.provider.contact' (?)
        #        if so, should be included only in "long description", while "summary" only returns below info
        meta = [
            {
                "type": "provider-name",
                "title": "Provider Name",
                "role": "http://www.opengis.net/eoc/applicationContext/providerMetadata",
                "value": wps.provider.name,
                "lang": wps_lang
            },
            {
                "type": "provider-site",
                "title": "Provider Site",
                "role": "http://www.opengis.net/eoc/applicationContext/providerMetadata",
                "value": wps.provider.url,
                "lang": wps_lang
            },
            {
                "type": "contact-name",
                "title": "Contact Name",
                "role": "http://www.opengis.net/eoc/applicationContext/providerMetadata",
                "value": wps.provider.contact.name,
                "lang": wps_lang
            }
        ]
        return meta

    def keywords(self, container=None):
        # type: (AnySettingsContainer) -> List[str]
        """
        Obtains the keywords relevant to the service provider.
        """
        wps = self.wps(container=container)
        return wps.identification.keywords

    def summary(self, container, fetch=True, ignore=False):
        # type: (AnySettingsContainer, bool, bool) -> Optional[JSON]
        """
        Obtain the summary information from the provider service.

        When metadata fetching is disabled, the generated summary will contain only information available locally.

        :param container: Employed to retrieve application settings.
        :param fetch: Indicates whether metadata should be fetched from remote.
        :param ignore: Indicates if failing metadata retrieval/parsing should be silently discarded or raised.
        :return: generated summary information.
        :raises ServiceParsingError:
            If the target service provider is not reachable, content is not parsable or any other error related to
            validating the service that needs to be understood for summary creation.
        :raises colander.Invalid: If the generated response format is not valid according to schema definition.
        """
        try:
            # FIXME: not implemented (https://github.com/crim-ca/weaver/issues/130)
            if not ProcessType.is_wps(self.type):
                return None
            self.check_accessible(container, ignore=ignore)
            # basic information always available (local)
            data = {
                "id": self.name,
                "url": self.url,  # remote URL (bw-compat, also in links)
                "type": ProcessType.WPS_REMOTE,
                "public": self.public,
                "links": self.links(container, fetch=fetch),
            }
            # retrieve more metadata from remote if possible and requested
            if fetch:
                wps = self.wps(container)
                data.update({
                    "title": getattr(wps.identification, "title", None),
                    "description": getattr(wps.identification, "abstract", None),
                    "keywords": self.keywords(container),
                    "metadata": self.metadata(container),
                })
            return sd.ProviderSummarySchema().deserialize(data)
        except colander.Invalid as exc:
            LOGGER.error("Failed schema validation on otherwise valid parsing of provider definition.", exc_info=exc)
            raise  # invalid schema on our side, don't ignore it
        except ServiceParsingError:
            raise
        except Exception as exc:
            msg = f"Exception occurred while fetching or parsing WPS [{self.name}] at [{self.url}]"
            err_msg = f"{msg}: {exc!r}"
            LOGGER.debug(err_msg, exc_info=exc)
            if ignore:
                warnings.warn(err_msg, NonBreakingExceptionWarning)
                return None
            raise ServiceParsingError(
                json={"description": msg, "cause": str(exc), "error": fully_qualified_name(exc)}
            ) from exc

    def processes(self, container, ignore=False):
        # type: (AnySettingsContainer, bool) -> Optional[List[Process]]
        """
        Obtains a list of remote service processes in a compatible :class:`weaver.datatype.Process` format.

        .. note::
            Remote processes won't be stored to the local process storage.

        :param container: Employed to retrieve application settings.
        :param ignore: Indicates if failing service retrieval/parsing should be silently discarded or raised.
        :raises ServiceParsingError: If parsing failed and was NOT requested to be ignored.
        :return:
            If parsing was successful, list of converted remote service processes.
            If parsing failed and was requested to be ignored, returns ``None`` to distinguish from empty process list.
        """
        # FIXME: support other providers (https://github.com/crim-ca/weaver/issues/130)
        if not ProcessType.is_wps(self.type):
            return []
        try:
            wps = self.wps(container)
        except ServiceParsingError as exc:
            err_msg = repr(exc)
            LOGGER.debug(err_msg, exc_info=exc)
            if ignore:
                warnings.warn(err_msg, NonBreakingExceptionWarning)
                return None
            raise
        settings = get_settings(container)
        return [Process.convert(process, self, settings) for process in wps.processes]

    def check_accessible(self, settings, ignore=True):
        # type: (AnySettingsContainer, bool) -> bool
        """
        Verify if the service URL is accessible.

        :param settings: Employed to retrieve application settings for the request.
        :param ignore: Indicates if an inaccessible service should be reported by ``False`` or by raising.
        :return: Whether the service responded with one of the acceptable status codes.
        :raises ServiceParsingError: If the service is not accessible and this was NOT requested to be ignored.
        """
        try:
            # some WPS don't like HEAD request, so revert to normal GetCapabilities
            # otherwise use HEAD because it is faster to only 'ping' the service
            if ProcessType.is_wps(self.type):
                meth = "GET"
                url = f"{self.url}?service=WPS&request=GetCapabilities"
            else:
                meth = "HEAD"
                url = self.url
            # - allow 500 for services that incorrectly handle invalid request params, but at least respond
            #   (should be acceptable in this case because the 'ping' request is not necessarily well-formed)
            # - allow 400/405 for bad request/method directly reported by the service for the same reasons
            # - enforce quick timeout (but don't allow 408 code) to avoid long pending connexions that never resolve
            allowed_codes = [200, 400, 405, 500]
            resp = request_extra(meth, url, timeout=2, settings=settings, allowed_codes=allowed_codes)
            code = resp.status_code
            accessible = code in allowed_codes
            if not accessible and not ignore:
                msg = f"Service [{self.name}] at [{self.url}] response status code [{code}] is not acceptable."
                raise ServiceParsingError(json={
                    "description": msg,
                    "cause": "Cannot validate or parse service metadata since it is not accessible.",
                })
            return accessible
        except (requests.exceptions.RequestException, pyramid.httpexceptions.HTTPException) as exc:
            msg = f"Exception occurred while checking service [{self.name}] accessibility at [{self.url}]"
            warnings.warn(f"{msg}: {exc!r}", NonBreakingExceptionWarning)
            if not ignore:
                raise ServiceParsingError(json={
                    "description": msg,
                    "cause": "Cannot validate or parse service metadata since it is not accessible.",
                    "error": exc.__class__.__name__
                }) from exc
        # only reached when the request failed and the failure was requested to be ignored
        return False





class Job(Base, LoggerHandler):
    """
    Dictionary that contains :term:`Job` details for local :term:`Process` or remote :term:`OWS` execution.

    It always has ``id`` and ``task_id`` keys.
    """

    def __init__(self, *args, **kwargs):
        # type: (*Any, **Any) -> None
        """
        Initializes the job from dictionary-like arguments and validates its mandatory fields.

        :raises TypeError: if ``task_id`` is missing or if the resolved ``id`` is neither a string nor a UUID.
        """
        super(Job, self).__init__(*args, **kwargs)
        has_task_id = "task_id" in self
        if not has_task_id:
            raise TypeError(f"Parameter 'task_id' is required for '{self.__name__}' creation.")
        job_id = self.id  # property access, generates and stores an identifier when none is defined
        if not isinstance(job_id, (str, uuid.UUID)):
            raise TypeError(f"Type 'str' or 'UUID' is required for '{self.__name__}.id'")
        # temporary directory is only created on demand by the 'tmpdir' property
        self["__tmpdir"] = None


[docs]
    def update_from(self, job):
        # type: (Job) -> None
        """
        Copies the internal control properties of the given :class:`Job` into this one.

        Only the ``__tmpdir`` entry is transferred (``None`` if the other job does not define it).
        """
        inherited_tmpdir = job.get("__tmpdir")
        self["__tmpdir"] = inherited_tmpdir



[docs]
    def cleanup(self):
        # type: () -> None
        """
        Removes the temporary directory of the :term:`Job`, if any, and forgets its reference.

        Removal errors are ignored. Once the directory does not exist anymore, the stored ``__tmpdir``
        reference is reset to ``None`` such that a following access to :attr:`tmpdir` generates a new
        directory instead of returning the path of a deleted one.
        """
        _tmpdir = self.get("__tmpdir")
        if not isinstance(_tmpdir, str):
            return
        if os.path.isdir(_tmpdir):
            shutil.rmtree(_tmpdir, ignore_errors=True)
        # keep the reference only if the directory could not be removed, to allow another cleanup attempt
        if not os.path.isdir(_tmpdir):
            self["__tmpdir"] = None


    @property

[docs]
    def tmpdir(self):
        # type: () -> Path
        """
        Temporary directory that the :term:`Job` can use to store files needed for its operation.

        The directory is created with :func:`tempfile.mkdtemp` on first access and its path is remembered
        under the ``__tmpdir`` entry. The caller is responsible for removing it by calling :meth:`cleanup`.
        """
        existing = self.get("__tmpdir")
        if existing:
            return existing
        created = tempfile.mkdtemp()
        self["__tmpdir"] = created
        return created


    @staticmethod

[docs]
    def _get_message(message, size_limit=None):
        # type: (str, Optional[int]) -> str
        msg_len = len(message)
        size_limit = size_limit if isinstance(size_limit, int) and size_limit > 0 else 1024**2
        if len(message) > size_limit:
            msg_size = apply_number_with_unit(msg_len, binary=True, decimals=2)
            return f"<message clipped due to large dimension ({msg_size})>"
        return message



[docs]
    def _get_log_msg(self, msg=None, status=None, progress=None, size_limit=None):
        # type: (Optional[str], Optional[AnyStatusType], Optional[Number], Optional[int]) -> str
        """
        Generates the log message entry with the job duration, progress and status details.

        :param msg: Message to log. Uses :attr:`status_message` if omitted or empty.
        :param status: Status to report in the entry. Uses :attr:`status` if omitted.
        :param progress:
            Progress to report in the entry, clamped to the ``[0, 100]`` range.
            Uses :attr:`progress` only if omitted (``None``), such that an explicit ``0`` is respected.
        :param size_limit: Maximum message size passed down to :meth:`_get_message`.
        :return: Message formatted by :func:`get_job_log_msg`.
        """
        msg = self._get_message(msg or self.status_message, size_limit=size_limit)
        status = map_status(status or self.status)
        # 'progress or self.progress' would discard an explicit override of zero
        if progress is None:
            progress = self.progress
        progress = max(0, min(100, progress))
        return get_job_log_msg(duration=self.duration_str, progress=progress, status=status, message=msg)


    @staticmethod

[docs]
    def _get_err_msg(error, size_limit=None):
        # type: (WPSException, Optional[int]) -> str
        error_msg = Job._get_message(error.text, size_limit=size_limit)
        return f"{error_msg} - code={error.code} - locator={error.locator}"



[docs]
    def log(self, level, message, *args, **kwargs):
        # type: (AnyLogLevel, str, *str, **Any) -> None
        """
        Implements the :class:`LoggerHandler` interface, allowing to pass the :term:`Job` directly as a logger.

        The message is formatted with :meth:`str.format` using the positional and keyword arguments.
        The keyword arguments are also forwarded to :meth:`save_log`, which accepts the same parameters.
        """
        formatted = message.format(*args, **kwargs)
        return self.save_log(level=level, message=formatted, **kwargs)



[docs]
    def save_log(self,
                 *,
                 errors=None,           # type: Optional[Union[str, Exception, WPSException, List[WPSException]]]
                 logger=None,           # type: Optional[Logger]
                 message=None,          # type: Optional[str]
                 level=INFO,            # type: AnyLogLevel
                 status=None,           # type: Optional[AnyStatusType]
                 progress=None,         # type: Optional[Number]
                 size_limit=None,       # type: Optional[int]
                 ):                     # type: (...) -> None
        """
        Logs the specified error and/or message, and adds the log entry to the complete job log.

        For each new log entry, additional :class:`Job` properties are added according to :meth:`Job._get_log_msg`
        and the format defined by :func:`get_job_log_msg`.

        :param errors:
            An error message, an exception, or a list of WPS exceptions to save in the job exceptions.
            A string or generic exception is saved as text while the log entry itself uses ``message``.
            Each WPS exception is saved with its code, locator and text, and produces its own log entry.
        :param logger:
            An additional :class:`Logger` to which logged messages are propagated on top of saving them to the job.
        :param message:
            Explicit string to be logged. Otherwise, the current :py:attr:`Job.status_message` is used.
        :param level:
            Logging level to apply to the logged ``message``. This parameter is ignored if ``errors`` are logged.
        :param status:
            Override status applied in the logged message entry, but does not set it to the job object.
            Uses the current :attr:`Job.status` value if not specified. Must be one of :mod:`weaver.status` values.
        :param progress:
            Override progress applied in the logged message entry, but does not set it to the job object.
            Uses the current :attr:`Job.progress` value if not specified.
        :param size_limit:
            Log message entries that individually exceed the limit will be clipped with a generic message.
            The parameter is provided for convenience, but take note that setting a too large value could cause the
            complete :term:`Job` to fail saving to the database if its total size exceeds the document limit.

        .. note::
            The job object is updated with the log but still requires to be pushed to database to actually persist it.
        """
        # normalize the errors: a single WPS exception becomes a list, any other exception becomes its text
        # (WPS exception is tested first; presumably it is itself an 'Exception' subclass - to be confirmed)
        if isinstance(errors, WPSException):
            errors = [errors]
        elif isinstance(errors, Exception):
            errors = self._get_message(str(errors), size_limit=size_limit)
        if isinstance(errors, str):
            # textual error: logged entry uses 'message' at ERROR level, the error text goes to the exceptions
            log_msg = [(ERROR, self._get_log_msg(message, status=status, progress=progress, size_limit=size_limit))]
            self.exceptions.append(errors)
        elif isinstance(errors, list):
            # one ERROR log entry and one structured exception per listed WPS exception
            log_msg = [
                (
                    ERROR,
                    self._get_log_msg(
                        self._get_err_msg(error, size_limit=size_limit),
                        status=status,
                        progress=progress,
                        size_limit=size_limit,
                    )
                )
                for error in errors
            ]
            self.exceptions.extend([{
                "Code": error.code,
                "Locator": error.locator,
                "Text": self._get_message(error.text, size_limit=size_limit),
            } for error in errors])
        else:
            # no error provided: plain message logged with the requested level
            log_msg = [(level, self._get_log_msg(message, status=status, progress=progress, size_limit=size_limit))]
        for lvl, msg in log_msg:
            fmt_data = {
                "asctime": now().strftime(get_log_date_fmt()),
                "levelname": getLevelName(lvl),
                "name": self.__name__,
                "message": msg,
            }
            fmt_msg = get_log_fmt() % fmt_data
            # skip an entry that is identical to the last saved one, which also skips its propagation to 'logger'
            if len(self.logs) == 0 or self.logs[-1] != fmt_msg:
                self.logs.append(fmt_msg)
                if logger:
                    logger.log(lvl, msg)


    @property

[docs]
    def id(self):
        # type: () -> uuid.UUID
        """
        Job UUID to retrieve the details from storage.

        A new UUID is generated and stored when none is defined. A string value is returned converted to UUID.
        """
        job_id = self.get("id")
        if not job_id:
            job_id = self["id"] = uuid.uuid4()
        return uuid.UUID(job_id) if isinstance(job_id, str) else job_id


    @property

[docs]
    def task_id(self):
        # type: () -> Optional[AnyUUID]
        """
        Reference Task UUID attributed by the ``Celery`` worker that monitors and executes this job.

        A string that is a valid UUID is returned as UUID. Any other value is returned unmodified.
        """
        task_id = self.get("task_id")
        if not isinstance(task_id, str):
            return task_id
        try:
            return uuid.UUID(task_id)
        except ValueError:
            # task ID can be a temporary non-UUID value
            return task_id


    @task_id.setter
    def task_id(self, task_id):
        # type: (AnyUUID) -> None
        """
        Stores the task identifier.

        :raises TypeError: if the value is neither a string nor a UUID.
        """
        if isinstance(task_id, (str, uuid.UUID)):
            self["task_id"] = task_id
            return
        raise TypeError(f"Type 'str' or 'UUID' is required for '{self.__name__}.task_id'")

    @property

[docs]
    def wps_id(self):
        # type: () -> Optional[uuid.UUID]
        """
        Reference WPS Request/Response UUID attributed by the executed ``PyWPS`` process.

        This UUID matches the status-location, log and output directory of the WPS process.
        This parameter is only available when the process is executed on this local instance.

        .. seealso::
            - :attr:`Job.request`
            - :attr:`Job.response`
        """
        stored = self.get("wps_id")
        # string representation is converted, anything else (including 'None') is returned directly
        return uuid.UUID(stored) if isinstance(stored, str) else stored


    @wps_id.setter
    def wps_id(self, wps_id):
        # type: (AnyUUID) -> None
        """
        Stores the WPS identifier.

        :raises TypeError: if the value is neither a string nor a UUID.
        """
        if isinstance(wps_id, (str, uuid.UUID)):
            self["wps_id"] = wps_id
            return
        raise TypeError(f"Type 'str' or 'UUID' is required for '{self.__name__}.wps_id'")

    @property

[docs]
    def wps_url(self):
        # type: () -> Optional[str]
        """
        Service URL reference for :term:`WPS` interface, or ``None`` when not defined.

        .. seealso::
            - :attr:`Process.processEndpointWPS1`
            - :attr:`Service.url`
        """
        return self.get("wps_url")


    @wps_url.setter
    def wps_url(self, service):
        # type: (Optional[str]) -> None
        """
        Stores the WPS service URL.

        :raises TypeError: if the value is not a string (``None`` is therefore rejected as well).
        """
        if isinstance(service, str):
            self["wps_url"] = service
            return
        raise TypeError(f"Type 'str' is required for '{self.__name__}.wps_url'")

    @property

[docs]
    def service(self):
        # type: () -> Optional[str]
        """
        Service identifier of the corresponding remote process, or ``None`` when not defined.

        .. seealso::
            - :attr:`Service.id`
        """
        return self.get("service")


    @service.setter
    def service(self, service):
        # type: (Optional[AnyServiceRef]) -> None
        """
        Stores the service identifier, using the ``id`` of a :class:`Service` instance when one is provided.

        :raises TypeError: if the resolved identifier is not a string (``None`` is therefore rejected as well).
        """
        service_id = service.id if isinstance(service, Service) else service
        if not isinstance(service_id, str):
            raise TypeError(f"Type 'str' is required for '{self.__name__}.service'")
        self["service"] = service_id

    @property

[docs]
    def process(self):
        # type: () -> Optional[str]
        """
        Process identifier of the corresponding remote process, or ``None`` when not defined.

        .. seealso::
            - :attr:`Process.id`
        """
        return self.get("process")


    @process.setter
    def process(self, process):
        # type: (Optional[AnyProcessRef]) -> None
        """
        Stores the process identifier, using the ``id`` of a :class:`Process` instance when one is provided.

        :raises TypeError: if the resolved identifier is not a string (``None`` is therefore rejected as well).
        """
        process_id = process.id if isinstance(process, Process) else process
        if not isinstance(process_id, str):
            raise TypeError(f"Type 'str' is required for '{self.__name__}.process'")
        self["process"] = process_id

    @property

[docs]
    def processing_entity_type(self):
        # type: () -> AnyJobProcessingEntityType
        """
        Type of entity that processes the job, which is always ``JobProcessingEntityType.OGC_API_PROCESSES``.
        """
        entity_type = JobProcessingEntityType.OGC_API_PROCESSES
        return entity_type


    @property

[docs]
    def type(self):
        # type: () -> str
        """
        Obtain the type of the element associated to the creation of this job.

        The type is a process when no service is defined, and a provider otherwise.

        .. seealso::
            - Defined in https://schemas.opengis.net/ogcapi/processes/part1/1.0/openapi/schemas/statusInfo.yaml.
            - Queried with https://docs.ogc.org/is/18-062r2/18-062r2.html#toc49 (Parameter Type section).
        """
        return JobStatusType.PROCESS if self.service is None else JobStatusType.PROVIDER


    @property

[docs]
    def title(self):
        # type: () -> Optional[str]
        """
        Value stored under the ``title`` entry, or ``None`` when not defined.
        """
        return self.get("title")


    @title.setter
    def title(self, title):
        # type: (Optional[str]) -> None
        """
        Stores the title, normalizing any empty value to ``None``.

        The validation condition is unchanged (only a non-empty value that is not a string is rejected), but
        an empty title is not stored as is anymore, such that the entry is either a non-empty string or ``None``.

        :raises TypeError: if a non-empty value that is not a string is provided.
        """
        if title and not isinstance(title, str):
            raise TypeError(f"Type 'str' or 'None' is required for '{self.__name__}.title'")
        # disallow empty title as well
        self["title"] = title or None


[docs]
    def _get_inputs(self):
        # type: () -> ExecutionInputs
        if self.get("inputs") is None:
            return {}
        return dict.__getitem__(self, "inputs")



[docs]
    def _set_inputs(self, inputs):
        # type: (Optional[ExecutionInputs]) -> None
        self["inputs"] = inputs


    # allows to correctly update list by ref using 'job.inputs.extend()'

[docs]
    # property built from explicit accessor functions ('_get_inputs' / '_set_inputs') instead of decorators
    inputs = property(
        _get_inputs,  # type: ignore
        _set_inputs,  # type: ignore
        doc="Input values and reference submitted for execution.",
    )



[docs]
    def _get_outputs(self):
        # type: () -> Optional[ExecutionOutputs]
        return self.get("outputs")



[docs]
    def _set_outputs(self, outputs):
        # type: (Optional[ExecutionOutputs]) -> None
        self["outputs"] = outputs



[docs]
    # property built from explicit accessor functions ('_get_outputs' / '_set_outputs') instead of decorators
    outputs = property(
        _get_outputs,  # type: ignore
        _set_outputs,  # type: ignore
        doc="Output transmission modes submitted for execution.",
    )


    @property

[docs]
    def user_id(self):
        # type: () -> Optional[Union[AnyUUID, int]]
        """
        Value stored under the ``user_id`` entry, or ``None`` when not defined.
        """
        return self.get("user_id")


    @user_id.setter
    def user_id(self, user_id):
        # type: (Optional[Union[AnyUUID, int]]) -> None
        """
        Stores the user identifier.

        :raises TypeError: if the value is not an integer, a string or a UUID (``None`` is therefore rejected).
        """
        if isinstance(user_id, (int, str, uuid.UUID)):
            self["user_id"] = user_id
            return
        raise TypeError(f"Type 'int', 'str' or a UUID is required for '{self.__name__}.user_id'")

    @property

[docs]
    def success(self):
        # type: () -> bool
        """
        Indicates if the category mapped from the current status is ``StatusCategory.SUCCESS``.
        """
        category = map_status(self.status, category=True)
        return category == StatusCategory.SUCCESS


    @property

[docs]
    def status(self):
        # type: () -> Status
        """
        Status resolved from the ``status`` entry, with ``Status.UNKNOWN`` provided as default to the lookup.
        """
        raw_status = self.get("status")
        return Status.get(raw_status, Status.UNKNOWN)


    @status.setter
    def status(self, status):
        # type: (StatusType) -> None
        """
        Stores the status resolved by ``Status.get``.

        :raises ValueError: if the resolved status is not one of the :class:`Status` values.
        """
        value = Status.get(status)
        # trace the origin of an unexpected transition from 'running' back to 'accepted' for debugging
        if value == Status.ACCEPTED and self.status == Status.RUNNING:
            LOGGER.debug(traceback.extract_stack())
        if value not in Status:
            statuses = list(Status.values())
            name = self.__name__
            # message previously ended with an unbalanced quote character
            raise ValueError(f"Status '{status}' is not valid for '{name}.status', must be one of {statuses!s}")
        self["status"] = value

    @property

[docs]
    def status_message(self):
        # type: () -> str
        """
        Value stored under the ``status_message`` entry, or ``"no message"`` when not defined.
        """
        fallback = "no message"
        return self.get("status_message", fallback)


    @status_message.setter
    def status_message(self, message):
        # type: (Optional[str]) -> None
        """
        Stores the status message. A ``None`` value is ignored, leaving the current message untouched.

        :raises TypeError: if the value is neither ``None`` nor a string.
        """
        if message is not None:
            if not isinstance(message, str):
                raise TypeError(f"Type 'str' is required for '{self.__name__}.status_message'")
            self["status_message"] = message

    @property

[docs]
    def status_location(self):
        # type: () -> Optional[str]
        """
        Value stored under the ``status_location`` entry, or ``None`` when not defined.
        """
        return self.get("status_location")


    @status_location.setter
    def status_location(self, location_url):
        # type: (Optional[str]) -> None
        """
        Stores the status location.

        :raises TypeError: if the value is not a string (``None`` is therefore rejected as well).
        """
        if isinstance(location_url, str):
            self["status_location"] = location_url
            return
        raise TypeError(f"Type 'str' is required for '{self.__name__}.status_location'")

    @property

[docs]
    def subscribers(self):
        # type: () -> Optional[ExecutionSubscribers]
        """
        Value stored under the ``subscribers`` entry, or ``None`` when not defined.
        """
        stored_subscribers = self.get("subscribers")
        return stored_subscribers


    @subscribers.setter
    def subscribers(self, subscribers):
        # type: (Optional[ExecutionSubscribers]) -> None
        """
        Stores the subscribers, normalizing any empty value to ``None``.

        A non-empty value must be a mapping of non-empty string keys to mappings of non-empty string
        keys and values. A nested mapping that is empty does not contribute any item to validate.

        :raises TypeError: if a non-empty value does not respect the expected structure.
        """
        if subscribers:
            valid = isinstance(subscribers, dict)
            if valid:
                for sub_type, subs in subscribers.items():
                    # a non-mapping item is replaced by a single invalid entry to make the validation fail
                    entries = subs if isinstance(subs, dict) else {None: None}
                    for sub, val in entries.items():
                        if not (
                            sub_type and isinstance(sub_type, str) and
                            sub and isinstance(sub, str) and
                            val and isinstance(val, str)
                        ):
                            valid = False
                            break
                    if not valid:
                        break
            if not valid:
                raise TypeError(
                    "Mapping of subscriber types, status and notification references "
                    f"is required for '{self.__name__}.subscribers'."
                )
        self["subscribers"] = subscribers or None

    @property

[docs]
    def accept_type(self):
        # type: () -> Optional[str]
        """
        Value stored under the ``accept_type`` entry, or ``None`` when not defined.
        """
        stored_type = self.get("accept_type")
        return stored_type


    @accept_type.setter
    def accept_type(self, content_type):
        # type: (Optional[str]) -> None
        """
        Stores the accepted content type, normalizing an empty string to ``None``.

        :raises TypeError: if the value is neither ``None`` nor a string.
        """
        if content_type is not None and not isinstance(content_type, str):
            raise TypeError(f"Type 'str' is required for '{self.__name__}.accept_type'")
        self["accept_type"] = content_type if content_type else None

    @property

[docs]
    def accept_language(self):
        # type: () -> Optional[str]
        """
        Value stored under the ``accept_language`` entry, or ``None`` when not defined.
        """
        stored_language = self.get("accept_language")
        return stored_language


    @accept_language.setter
    def accept_language(self, language):
        # type: (Optional[str]) -> None
        """
        Stores the accepted language, normalizing an empty string to ``None``.

        :raises TypeError: if the value is neither ``None`` nor a string.
        """
        if language is not None and not isinstance(language, str):
            raise TypeError(f"Type 'str' is required for '{self.__name__}.accept_language'")
        self["accept_language"] = language if language else None

    @property

[docs]
    def accept_profile(self):
        # type: () -> Optional[str]
        """
        Value stored under the ``accept_profile`` entry, or ``None`` when not defined.
        """
        stored_profile = self.get("accept_profile")
        return stored_profile


    @accept_profile.setter
    def accept_profile(self, profile):
        # type: (Optional[str]) -> None
        """
        Stores the accepted profile, normalizing an empty string to ``None``.

        :raises TypeError: if the value is neither ``None`` nor a string.
        :raises ValueError: if a non-empty string is not accepted by :func:`is_valid_url`.
        """
        if profile is not None and not isinstance(profile, str):
            raise TypeError(f"Type 'str' is required for '{self.__name__}.accept_profile'")
        if not profile:
            self["accept_profile"] = None
            return
        if not is_valid_url(profile):
            raise ValueError(f"Valid URI is required for '{self.__name__}.accept_profile'")
        self["accept_profile"] = profile

    @property

[docs]
    def execute_async(self):
        # type: () -> bool
        """
        Indicates if the execution mode equals ``ExecuteMode.ASYNC``.
        """
        mode = self.execution_mode
        return mode == ExecuteMode.ASYNC


    @property

[docs]
    def execute_sync(self):
        # type: () -> bool
        """
        Indicates if the execution mode equals ``ExecuteMode.SYNC``.
        """
        mode = self.execution_mode
        return mode == ExecuteMode.SYNC


    @property

[docs]
    def execution_mode(self):
        # type: () -> AnyExecuteMode
        """
        Mode resolved from the ``execution_mode`` entry, with ``ExecuteMode.AUTO`` provided as default to the lookup.
        """
        raw_mode = self.get("execution_mode")
        return ExecuteMode.get(raw_mode, ExecuteMode.AUTO)


    @execution_mode.setter
    def execution_mode(self, mode):
        # type: (Union[AnyExecuteMode, str]) -> None
        """
        Stores the execution mode resolved by ``ExecuteMode.get``.

        :raises ValueError: if the resolved mode is not one of the :class:`ExecuteMode` values.
        """
        exec_mode = ExecuteMode.get(mode)
        if exec_mode not in ExecuteMode:
            modes = list(ExecuteMode.values())
            raise ValueError(f"Invalid value for '{self.__name__}.execution_mode'. Must be one of {modes}")
        # store the validated mode rather than the raw input, as done by the other 'execution_*' setters
        self["execution_mode"] = exec_mode

    @property

[docs]
    def execution_wait(self):
        # type: () -> Optional[int]
        """
        Execution time (in seconds) to wait for a synchronous response.

        Always ``None`` when the execution is asynchronous.
        """
        return None if self.execute_async else self.get("execution_wait")


    @execution_wait.setter
    def execution_wait(self, wait):
        # type: (Optional[int]) -> None
        """
        Stores the execution wait time.

        :raises ValueError: if the value is neither ``None`` nor an integer.
        """
        if wait is not None and not isinstance(wait, int):
            raise ValueError(f"Invalid value for '{self.__name__}.execution_wait'. Must be None or an integer.")
        self["execution_wait"] = wait

    @property

[docs]
    def execution_response(self):
        # type: () -> AnyExecuteResponse
        """
        Execution response stored for the job, using ``ExecuteResponse.DOCUMENT`` when missing or invalid.

        The resolved value is written back to the ``execution_response`` entry.
        """
        default = ExecuteResponse.DOCUMENT
        current = self.setdefault("execution_response", default)
        resolved = current if current in ExecuteResponse.values() else default
        self["execution_response"] = resolved
        return resolved


    @execution_response.setter
    def execution_response(self, response):
        # type: (Optional[Union[AnyExecuteResponse, str]]) -> None
        """
        Stores the execution response resolved by ``ExecuteResponse.get``, or the document response for ``None``.

        :raises ValueError: if the resolved response is not one of the :class:`ExecuteResponse` values.
        """
        exec_resp = ExecuteResponse.DOCUMENT if response is None else ExecuteResponse.get(response)
        if exec_resp not in ExecuteResponse:
            resp = list(ExecuteResponse.values())
            raise ValueError(f"Invalid value for '{self.__name__}.execution_response'. Must be one of {resp}")
        self["execution_response"] = exec_resp

    @property

[docs]
    def execution_return(self):
        # type: () -> AnyExecuteReturnPreference
        """
        Return preference stored for the job, using ``ExecuteReturnPreference.MINIMAL`` when missing or invalid.

        The resolved value is written back to the ``execution_return`` entry.
        """
        default = ExecuteReturnPreference.MINIMAL  # almost equivalent to 'document'
        current = self.setdefault("execution_return", default)
        resolved = current if current in ExecuteReturnPreference.values() else default
        self["execution_return"] = resolved
        return resolved


    @execution_return.setter
    def execution_return(self, return_preference):
        # type: (Optional[Union[AnyExecuteReturnPreference, str]]) -> None
        """
        Stores the preference resolved by ``ExecuteReturnPreference.get``, or the minimal one for ``None``.

        :raises ValueError: if the resolved preference is not one of the :class:`ExecuteReturnPreference` values.
        """
        exec_ret = (
            ExecuteReturnPreference.MINIMAL
            if return_preference is None
            else ExecuteReturnPreference.get(return_preference)
        )
        if exec_ret not in ExecuteReturnPreference:
            return_prefs = list(ExecuteReturnPreference.values())
            raise ValueError(f"Invalid value for '{self.__name__}.execution_return'. Must be one of {return_prefs}")
        self["execution_return"] = exec_ret

    @property

[docs]
    def is_local(self):
        # type: () -> bool
        """
        Value stored under the ``is_local`` entry. When missing, it is considered local if no service is defined.
        """
        local_by_default = not self.service
        return self.get("is_local", local_by_default)


    @is_local.setter
    def is_local(self, is_local):
        # type: (bool) -> None
        """
        Stores the local execution flag.

        :raises TypeError: if the value is not a boolean.
        """
        if isinstance(is_local, bool):
            self["is_local"] = is_local
            return
        raise TypeError(f"Type 'bool' is required for '{self.__name__}.is_local'")

    @property

[docs]
    def is_workflow(self):
        # type: () -> bool
        """
        Value stored under the ``is_workflow`` entry, or ``False`` when not defined.
        """
        default_flag = False
        return self.get("is_workflow", default_flag)


    @is_workflow.setter
    def is_workflow(self, is_workflow):
        # type: (bool) -> None
        """
        Stores the workflow flag.

        :raises TypeError: if the value is not a boolean.
        """
        if isinstance(is_workflow, bool):
            self["is_workflow"] = is_workflow
            return
        raise TypeError(f"Type 'bool' is required for '{self.__name__}.is_workflow'")

    @property

[docs]
    def is_finished(self):
        # type: () -> bool
        """
        Indicates if a ``finished`` date and time is defined for the job.
        """
        finished_time = self.finished
        return finished_time is not None



[docs]
    def mark_finished(self):
        # type: () -> None
        """
        Sets the ``finished`` entry to the value returned by :func:`now`.
        """
        completed_at = now()
        self["finished"] = completed_at



[docs]
    def _get_updated(self):
        # type: () -> datetime
        """
        Returns the localized date and time of the last update.

        When the ``updated`` entry is missing, the value is derived from the creation time for an accepted
        job, from the finished time for a finished job, and from the started time otherwise, with the current
        time as last resort. The derived value is saved through the ``updated`` property.
        """
        updated = self.get("updated")
        if updated:
            return localize_datetime(updated)
        # backward compatibility when not already set
        if self.status == map_status(Status.ACCEPTED):
            fallback = self.created
        elif self.is_finished:
            fallback = self.finished
        else:
            fallback = self.started
        updated = localize_datetime(fallback or now())
        self.updated = updated  # apply to remain static until saved
        return localize_datetime(updated)



[docs]
    # descriptor configured with 'default_now=True' (presumably resolves to the current time when unset - confirm)
    created = LocalizedDateTimeProperty(default_now=True)


[docs]
    # descriptor without default; 'duration' treats a falsy value as a job that has not started
    started = LocalizedDateTimeProperty()


[docs]
    # descriptor without default; 'is_finished' checks that this value is not 'None'
    finished = LocalizedDateTimeProperty()


[docs]
    # descriptor using '_get_updated' as getter, which derives a value when the entry is missing
    updated = LocalizedDateTimeProperty(fget=_get_updated)  # type: ignore


    @property

[docs]
    def duration(self):
        # type: () -> Optional[timedelta]
        """
        Elapsed time between the started and the finished times, or until now for an unfinished job.

        :return: ``None`` if the job is not started, the time difference otherwise.
        """
        if self.started:
            end_time = self.finished or now()
            return localize_datetime(end_time) - localize_datetime(self.started)
        return None


    @property

[docs]
    def duration_str(self):
        # type: () -> str
        """
        Duration of the job formatted as ``HH:MM:SS``, with fractions of seconds dropped.

        Durations of a day or more accumulate in the hours field (e.g.: ``26:03:04``) rather than using the
        ``"1 day, 2:03:04"`` string representation of :class:`datetime.timedelta`.
        A missing or negative duration is reported as ``00:00:00``.
        """
        duration = self.duration
        if duration is None:
            return "00:00:00"
        # floor division by one second provides whole seconds without floating point rounding
        total_seconds = max(duration // timedelta(seconds=1), 0)
        hours, remainder = divmod(total_seconds, 3600)
        minutes, seconds = divmod(remainder, 60)
        return f"{hours:02d}:{minutes:02d}:{seconds:02d}"  # "HH:MM:SS"


    @property

[docs]
    def progress(self):
        # type: () -> Number
        """
        Value stored under the ``progress`` entry, or ``0`` when not defined.
        """
        initial_progress = 0
        return self.get("progress", initial_progress)


    @progress.setter
    def progress(self, progress):
        # type: (Number) -> None
        """
        Stores the progress value.

        :raises TypeError: if the value is not an integer or a floating point number.
        :raises ValueError: if the value is lower than 0 or greater than 100.
        """
        is_number = isinstance(progress, (int, float))
        if not is_number:
            raise TypeError(f"Number is required for '{self.__name__}.progress'")
        out_of_range = progress < 0 or progress > 100
        if out_of_range:
            raise ValueError(f"Value must be in range [0,100] for '{self.__name__}.progress'")
        self["progress"] = progress

    @property

[docs]
    def statistics(self):
        # type: () -> Optional[Statistics]
        """
        Collected statistics about used memory and processing units if available, ``None`` otherwise.
        """
        collected = self.get("statistics")
        return collected


    @statistics.setter
    def statistics(self, stats):
        # type: (Statistics) -> None
        """
        Stores the statistics.

        :raises TypeError: if the value is not a dictionary.
        """
        if isinstance(stats, dict):
            self["statistics"] = stats
            return
        raise TypeError(f"Type 'dict' is required for '{self.__name__}.statistics'")


[docs]
    def _get_results(self):
        # type: () -> JobResults
        if self.get("results") is None:
            self["results"] = []
        return dict.__getitem__(self, "results")



[docs]
    def _set_results(self, results):
        # type: (JobResults) -> None
        if not isinstance(results, list):
            raise TypeError(f"Type 'list' is required for '{self.__name__}.results'")
        self["results"] = results


    # allows to correctly update list by ref using 'job.results.extend()'

[docs]
    # property built from explicit accessor functions ('_get_results' / '_set_results') instead of decorators
    results = property(
        _get_results,  # type: ignore
        _set_results,  # type: ignore
        doc="Output values and references that resulted from execution.",
    )



[docs]
    def _get_exceptions(self):
        # type: () -> List[Union[str, Dict[str, str]]]
        if self.get("exceptions") is None:
            self["exceptions"] = []
        return dict.__getitem__(self, "exceptions")



[docs]
    def _set_exceptions(self, exceptions):
        # type: (List[Union[str, Dict[str, str]]]) -> None
        if not isinstance(exceptions, list):
            raise TypeError(f"Type 'list' is required for '{self.__name__}.exceptions'")
        self["exceptions"] = exceptions


    # allows to correctly update list by ref using 'job.exceptions.extend()'

[docs]
    # property built from explicit accessor functions ('_get_exceptions' / '_set_exceptions')
    exceptions = property(_get_exceptions, _set_exceptions)  # type: ignore



[docs]
    def _get_logs(self):
        # type: () -> List[str]
        if self.get("logs") is None:
            self["logs"] = []
        return dict.__getitem__(self, "logs")



[docs]
    def _set_logs(self, logs):
        # type: (List[str]) -> None
        if not isinstance(logs, list):
            raise TypeError(f"Type 'list' is required for '{self.__name__}.logs'")
        self["logs"] = logs


    # allows to correctly update list by ref using 'job.logs.extend()'

[docs]
    # property built from explicit accessor functions ('_get_logs' / '_set_logs')
    logs = property(_get_logs, _set_logs)  # type: ignore



[docs]
    def _get_tags(self):
        # type: () -> List[Optional[str]]
        if self.get("tags") is None:
            self["tags"] = []
        return dict.__getitem__(self, "tags")



[docs]
    def _set_tags(self, tags):
        # type: (List[Optional[str]]) -> None
        if not isinstance(tags, list):
            raise TypeError(f"Type 'list' is required for '{self.__name__}.tags'")
        self["tags"] = tags


    # allows to correctly update list by ref using 'job.tags.extend()'

[docs]
    # property built from explicit accessor functions ('_get_tags' / '_set_tags')
    tags = property(_get_tags, _set_tags)  # type: ignore


    @property

[docs]
    def access(self):
        # type: () -> Visibility
        """
        Job visibility access from execution, with ``Visibility.PRIVATE`` provided as default to the lookup.
        """
        raw_access = self.get("access")
        return Visibility.get(raw_access, Visibility.PRIVATE)


    @access.setter
    def access(self, visibility):
        # type: (str) -> None
        """
        Job visibility access from execution.

        The provided value itself is validated against the ``Visibility`` values, and the value
        resolved by ``Visibility.get`` is the one stored.

        :raises ValueError: if the provided value is not one of the ``Visibility`` values.
        """
        resolved = Visibility.get(visibility)
        allowed = Visibility.values()
        if visibility not in allowed:
            raise ValueError(f"Invalid 'visibility' value '{visibility!s}' specified for '{self.__name__}.access'")
        self["access"] = resolved

    @property

[docs]
    def context(self):
        # type: () -> Optional[str]
        """
        Job outputs context, with any empty value reported as ``None``.
        """
        stored_context = self.get("context")
        return stored_context if stored_context else None


    @context.setter
    def context(self, context):
        # type: (Optional[str]) -> None
        """
        Job outputs context.

        :raises TypeError: if the value is neither ``None`` nor a string.
        """
        if context is not None and not isinstance(context, str):
            raise TypeError(f"Type 'str' or 'None' is required for '{self.__name__}.context'")
        self["context"] = context

    @property

[docs]
    def request(self):
        # type: () -> Optional[str]
        """
        XML request for WPS execution submission as string (binary), or ``None`` when not defined.
        """
        return self.get("request")


    @request.setter
    def request(self, request):
        # type: (Optional[str]) -> None
        """
        XML request for WPS execution submission as string (binary).

        An XML object is converted with :func:`xml_util.tostring` before being stored.
        """
        is_xml = isinstance(request, xml_util.XML)
        self["request"] = xml_util.tostring(request) if is_xml else request

    @property

[docs]
    def response(self):
        # type: () -> Optional[str]
        """
        XML status response from WPS execution submission as string (binary), or ``None`` when not defined.
        """
        return self.get("response")


    @response.setter
    def response(self, response):
        # type: (Optional[str]) -> None
        """
        XML status response from WPS execution submission as string (binary).

        An XML object is converted with :func:`xml_util.tostring` before being stored.
        """
        is_xml = isinstance(response, xml_util.XML)
        self["response"] = xml_util.tostring(response) if is_xml else response


[docs]
    def process_url(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        Builds the URL of the process that the job refers to.

        The provider path is included between the base URL and the process path when a service is defined.

        :param container: Reference from which to retrieve the application settings.
        :return: URL of the process description.
        """
        settings = get_settings(container)
        url_parts = [get_wps_restapi_base_url(settings)]
        if self.service is not None:
            url_parts.append(sd.provider_service.path.format(provider_id=self.service))
        url_parts.append(sd.process_service.path.format(process_id=self.process))
        return "".join(url_parts)



[docs]
    def job_url(self, container=None, extra_path=None):
        # type: (Optional[AnySettingsContainer], Optional[str]) -> str
        """
        Builds the URL of the job nested under its process URL.

        :param container: Reference from which to retrieve the application settings.
        :param extra_path: Additional path to append after the job location, if any.
        """
        process_location = self.process_url(container)
        job_location = sd.job_service.path.format(job_id=self.id)
        suffix = extra_path or ""
        return process_location + job_location + suffix



[docs]
    def status_url(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        URL of the job status, which is the job URL without any extra path.
        """
        url = self.job_url(container=container)
        return url



[docs]
    def logs_url(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        URL of the job logs, which is the job URL followed by ``/logs``.
        """
        url = self.job_url(container=container, extra_path="/logs")
        return url



[docs]
    def exceptions_url(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        URL of the job exceptions, which is the job URL followed by ``/exceptions``.
        """
        url = self.job_url(container=container, extra_path="/exceptions")
        return url



[docs]
    def inputs_url(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        URL of the job inputs, which is the job URL followed by ``/inputs``.
        """
        url = self.job_url(container=container, extra_path="/inputs")
        return url



[docs]
    def outputs_url(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        URL of the job outputs, which is the job URL followed by ``/outputs``.
        """
        url = self.job_url(container=container, extra_path="/outputs")
        return url



[docs]
    def results_url(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        URL of the job results, which is the job URL followed by ``/results``.
        """
        url = self.job_url(container=container, extra_path="/results")
        return url



[docs]
    def result_path(self, job_id=None, output_id=None, file_name=None):
        # type: (Optional[AnyUUID], Optional[str], Optional[str]) -> str
        """
        Obtains a *relative* result path, according to requested parameters and the :term:`Job` definition.

        The job context, when defined, is applied as prefix of the generated path.

        :param job_id: Override ID to employ for the job path. Otherwise, uses the job UUID by default.
            This should be used for cases where the ID is "not yet" established by the job, or that an alternate
            location based on a UUID established by another source must be employed.
        :param output_id:
            Output ID to refer to in the path. If omitted, the path stops at the job ID fragment.
        :param file_name:
            Output file name and extension to apply to the path. If omitted, the path stops at the output ID.
            It is ignored when no output ID is provided.
        :return: Resolved *relative* result path.
        """
        fragments = [str(job_id or self.id)]
        context = self.context
        if context:
            fragments.insert(0, context)
        if output_id:
            fragments.append(output_id)
            if file_name:
                fragments.append(file_name)
        return os.path.join(*fragments)



[docs]
    def get_all_possible_formats_links(self, url, results):
        # type: (str, Optional[List[JSON]]) -> List[Link]
        """
        Get direct links to all outputs in any possible format.

        Results without a media-type, or with a media-type listed in ``EXCLUDED_TYPES``, produce no link.

        :param url: The base URL for constructing links.
        :param results:
            A list of result dictionaries containing "mimeType" and "identifier".
            An empty or undefined list yields no links.
        :returns: A list of dictionaries representing the links to all possible output formats.
        """
        links = []  # type: List[Link]
        # tolerate jobs for which no results were stored yet
        for result in results or []:
            media_type = get_field(result, "mimeType", search_variations=True)
            if not media_type or media_type in EXCLUDED_TYPES:
                continue
            # named 'output_id' to avoid shadowing the 'id' builtin
            output_id = get_field(result, "identifier", search_variations=True)
            alternate_formats = extend_alternate_formats([{"mediaType": media_type}])
            links.extend(
                {
                    "href": f"{url}/{output_id}?f={fmt['mediaType']}",
                    "rel": "output",
                    "id": output_id,
                    "type": fmt["mediaType"],
                    "title": f"Link to job {output_id} result in {fmt['mediaType']}"
                }
                for fmt in alternate_formats
            )
        return links



[docs]
    def prov_url(self, container=None, extra_path=None):
        # type: (Optional[AnySettingsContainer], Optional[ProvenancePathType]) -> str
        """
        Build the :term:`Job` URL extended with the ``/prov`` sub-path and any additional path provided.
        """
        suffix = str(extra_path) if extra_path else ""
        return self.job_url(container=container, extra_path=f"/prov{suffix}")



[docs]
    def prov_path(self, container=None, extra_path=None, prov_format=None):
        # type: (Optional[AnySettingsContainer], Optional[ProvenancePathType], Optional[AnyProvenanceFormat]) -> Optional[str]
        """
        Obtain the path of the ``PROV`` contents under the WPS output directory.

        :param container: Settings container used to resolve the WPS output directory.
        :param extra_path: Requested ``PROV`` sub-path. Only ``None`` and ``"/prov"`` map to a known location.
        :param prov_format: Requested representation, resolved with :meth:`ProvenanceFormat.get`.
        :return:
            Path to the ``PROV`` directory (no sub-path and no format), path to the metadata file of
            the requested format (``"/prov"`` sub-path), or ``None`` if the combination is not mapped.
        """
        prov_dir = f"{self.result_path()}-prov"
        prov_fmt = ProvenanceFormat.get(prov_format, allow_media_type=True)
        prov_meta = f"{prov_dir}/metadata/provenance/primary.cwlprov"
        prov_extensions = [
            (None, "json"),  # representation used when no specific format is requested
            (ProvenanceFormat.PROV_JSON, "json"),
            (ProvenanceFormat.PROV_JSONLD, "jsonld"),
            (ProvenanceFormat.PROV_TURTLE, "ttl"),
            (ProvenanceFormat.PROV_XML, "xml"),
            (ProvenanceFormat.PROV_N, "provn"),
            (ProvenanceFormat.PROV_NT, "nt"),
        ]
        known_paths = {
            ("/prov", fmt): f"{prov_meta}.{ext}"
            for fmt, ext in prov_extensions
        }  # type: Dict[Tuple[Optional[ProvenancePathType], ProvenanceFormat], str]
        known_paths[(None, None)] = prov_dir  # the directory itself with all metadata
        resolved = known_paths.get((extra_path, prov_fmt))
        if not resolved:
            return resolved
        return os.path.join(get_wps_output_dir(container), resolved)



[docs]
    def prov_data(
        self,
        container=None,     # type: Optional[AnySettingsContainer]
        extra_path=None,    # type: Optional[Union[ProvenancePathType, str]]
        prov_format=None,   # type: AnyContentType
    ):                      # type: (...) -> Tuple[Optional[str], Optional[AnyContentType]]
        """
        Read or retrieve data from the packaged provenance directory contents associated to the :term:`Job`.

        If :meth:`prov_path` resolves the request to an existing file, its text contents are returned directly.
        Otherwise, the request is delegated to the ``cwlprov`` tool executed against the provenance directory,
        using the path fragments following ``/prov/`` as the operation and its parameters.

        :param container: Settings container forwarded to :meth:`prov_path` to locate the provenance contents.
        :param extra_path: Requested ``PROV`` sub-path.
        :param prov_format: Requested format of the provenance contents.
        :return:
            Tuple of the data and its format, or ``(None, None)`` if the provenance directory
            does not exist or the tool reported an error code.
        """
        prov_path = self.prov_path(container=container, extra_path=extra_path, prov_format=prov_format)
        if prov_path and os.path.isfile(prov_path):
            # pre-generated metadata file matching the requested path/format, return it as is
            with open(prov_path, mode="r", encoding="utf-8") as prov_f:
                data = prov_f.read()
            fmt = prov_format
        else:
            # no matching file, fall back to the provenance directory itself to query it with the tool
            prov_path = self.prov_path(container=container)
            if not prov_path or not os.path.isdir(prov_path):
                return None, None
            # keep only what follows '/prov/': first fragment is the operation, the rest are its parameters
            path = str(extra_path).split("/prov/", 1)[-1]
            frag = path.strip("/").split("/")
            oper, params = frag[0], frag[1:]
            args = ["-d", prov_path, oper]
            # operation-specific options passed to the tool
            if oper == "run":
                args.extend(["--steps", "--start", "--end", "--duration", "--labels", "--inputs", "--outputs"])
            elif oper in ["inputs", "outputs"]:
                args.extend(["--parameters", "--format", "uris"])
            args.extend(params)
            tool = CWLProvTool(args)
            tool.output = io.StringIO()  # override the buffer argument to "print"
            result = tool.main()  # noqa  # function annotated to return nothing, but sometimes returns an error code
            if result not in [0, None]:
                return None, None
            # rewind the captured buffer to read everything the tool printed
            tool.output.seek(0)
            data = tool.output.read()
            fmt = ContentType.TEXT_PLAIN
        # the tool branch always reports plain text, so this conversion only applies to file contents
        # NOTE(review): assumes the file read for a YAML request holds JSON contents - confirm
        if fmt == ContentType.APP_YAML:
            data = json.loads(data)
            data = OutputFormat.convert(data, to=OutputFormat.YAML)
        return data, fmt



[docs]
    def links(self, container=None, self_link=None):
        # type: (Optional[AnySettingsContainer], Optional[str]) -> List[Link]
        """
        Obtains the JSON links section of the response body for a :term:`Job`.

        If :paramref:`self_link` is provided (e.g.: `"outputs"`) the link for that corresponding item will also
        be added as `self` entry to the links. It must be a recognized job link field.

        The returned links always include the status, listing, execution, inputs and logs references.
        Links to outputs, results, statistics and provenance are only added for a successful job,
        whereas the exceptions link is only added for a job finished with any other status.

        :param container: object that helps retrieve instance details, namely the host URL.
        :param self_link: name of a section that represents the current link that will be returned.
        :return: List of links, each completed with default ``type`` and ``hreflang`` when not already defined.
        """
        settings = get_settings(container)
        html_on = settings.get("weaver.wps_restapi_html", True)
        base_url = get_wps_restapi_base_url(settings)
        job_url = self.job_url(settings)  # full URL
        job_path = base_url + sd.job_service.path.format(job_id=self.id)
        # NOTE(review): only the last path segment of the job URL is replaced - confirm the resulting endpoint
        job_exec = f"{job_url.rsplit('/', 1)[0]}/execution"
        job_list = base_url + sd.jobs_service.path
        job_links = [  # type: List[Link]
            {"href": job_url, "rel": "status", "title": "Job status."},  # OGC
            {"href": job_url, "rel": "monitor", "title": "Job monitoring location."},  # IANA
            {"href": get_path_kvp(job_path, f=OutputFormat.JSON), "type": ContentType.APP_JSON,
             "rel": "alternate", "title": "Job status generic endpoint."},  # IANA
            {"href": job_list, "rel": sd.OGC_API_PROC_REL_JOB_LIST_URI,  # OGC
             "title": "List of submitted jobs."},
            {"href": job_exec, "rel": sd.OGC_API_PROC_REL_EXECUTE_URI,
             "title": "New job submission endpoint for the corresponding process."},
            {"href": f"{job_url}/inputs", "rel": "inputs",  # unofficial
             "title": "Submitted job inputs for process execution."}
        ]
        # HTML alternate representation, enabled unless the setting explicitly disables it
        if html_on:
            job_links.append({
                "href": get_path_kvp(job_path, f=OutputFormat.HTML),
                "rel": "alternate",
                "title": "HTML Job Status",
                "type": ContentType.TEXT_HTML,
            })
        if self_link in ["status", None]:
            job_links.extend([
                {"href": job_list, "rel": "collection", "title": "List of submitted jobs."},  # IANA
                {"href": sd.OGC_API_PROC_PROFILE_JOB_DESC_URI, "rel": "profile", "title": "Job response profile."},
            ])

        # links that depend on the outcome are only relevant once the job is finished
        if self.status in JOB_STATUS_CATEGORIES[StatusCategory.FINISHED]:
            job_status = map_status(self.status)
            if job_status == Status.SUCCESSFUL:
                job_links.extend([
                    {"href": f"{job_url}/outputs", "rel": "outputs",  # unofficial
                     "title": "Job outputs of successful process execution (extended outputs with metadata)."},
                    {"href": f"{job_url}/results", "rel": sd.OGC_API_PROC_REL_JOB_RESULTS_URI,
                     "title": "Job results of successful process execution (direct output values mapping)."},
                    {"href": f"{job_url}/statistics", "rel": "statistics",  # unofficial
                     "title": "Job statistics collected following process execution."},
                    {"href": f"{job_url}/prov", "rel": "provenance",  # unofficial
                     "title": "Job provenance collected following process execution."},
                    {"href": f"{job_url}/prov", "rel": "https://www.w3.org/ns/prov",  # unofficial
                     "title": "Job provenance collected following process execution."},
                ])
                # direct links to each output in every alternate format
                f_links = self.get_all_possible_formats_links(url=job_url, results=self.results)
                if len(f_links) > 0:
                    job_links.extend(f_links)
            else:
                job_links.append({
                    "href": f"{job_url}/exceptions", "rel": sd.OGC_API_PROC_REL_EXCEPTIONS_URI,
                    "title": "List of job exceptions if applicable in case of failing job."
                })
        job_links.extend([
            {
                "href": f"{job_url}/logs", "rel": "logs",  # unofficial
                "title": "List of collected job logs during process execution."
            },
            {
                # official, same as 'rel="[ogc-rel:log]"'
                "href": f"{job_url}/logs", "rel": sd.OGC_API_PROC_REL_JOB_LOG_URI,
                "title": "List of collected job logs during process execution."
            }
        ])
        if self_link in ["status", "inputs", "outputs", "results", "logs", "exceptions", "provenance"]:
            # the last link whose relation ends with the requested name is duplicated as 'self'
            # NOTE(review): raises 'IndexError' if no such link was added above
            #   (e.g.: "outputs" requested for a job that is not successful) - confirm callers guard against it
            self_link_body = list(filter(lambda _link: _link["rel"].endswith(self_link), job_links))[-1]
            # copy to avoid modifying the 'rel' of the matched link itself
            self_link_body = copy.deepcopy(self_link_body)
            # back to specific job if we are in one of its sub-endpoints
            self_link_up = {"href": job_url, "rel": "up", "title": "Job status details."}
        else:
            self_link_body = {"href": job_url, "title": "Job status."}
            # back to full list of jobs if we are already on the job itself
            self_link_up = {"href": job_list, "rel": "up", "title": "List of submitted jobs."}
        self_link_body["rel"] = "self"
        job_links.extend([self_link_body, self_link_up])
        # apply default metadata only to links that did not explicitly define them
        link_meta = {"type": ContentType.APP_JSON, "hreflang": AcceptLanguage.EN_CA}
        for link in job_links:
            for meta, param in link_meta.items():
                link.setdefault(meta, param)
        return job_links



[docs]
    def summary(self, validate=True, **kwargs):
        # type: (bool, **JSON) -> JSON
        """
        Obtains the minimal :term:`JSON` representation of the :term:`Job`.

        :param validate: Whether the contents must be deserialized by the summary schema or returned as is.
        :param kwargs: Additional fields to add to (or to override in) the summary.
        :return: Summary contents of the job.
        """
        job_summary = {
            # provide both 'id' and 'jobID' for convenience/backward compatibility
            "id": self.id,
            "jobID": self.id,
            "processID": self.process,
            # dropped by validator if not applicable
            "providerID": self.service,
            "type": self.type,
            "status": map_status(self.status),
            "processingEntityType": self.processing_entity_type,
        }
        job_summary.update(**kwargs)
        if not validate:
            return job_summary
        return sd.JobSummary().deserialize(job_summary)



[docs]
    def json(self, container=None, **kwargs):  # pylint: disable=W0221,arguments-differ
        # type: (Optional[AnySettingsContainer], **JSON) -> JSON
        """
        Obtains the :term:`JSON` data representation for :term:`Job` response body.

        .. note::
            Settings are required to update API shortcut URLs to job additional information.
            Without them, paths will not include the API host, which will not resolve to full URI.

        :param container: Settings container used to resolve the links. Empty settings are used when omitted.
        :param kwargs: Additional fields to add to (or to override in) the contents before validation.
        :return: Job status contents deserialized by the job status schema.
        """
        settings = {}
        if container:
            settings = get_settings(container)
        # identification of the job and what it executes
        job_status = {
            "id": self.id,  # provide both 'id' and 'jobID' for convenience/backward compatibility
            "jobID": self.id,
            "processID": self.process,
            "providerID": self.service,
            "processingEntityType": self.processing_entity_type,
            "type": self.type,
            "title": self.title,
        }
        # current state and timing details
        job_status.update({
            "status": map_status(self.status),
            "message": self.status_message,
            "created": self.created,
            "started": self.started,
            "finished": self.finished,
            "updated": self.updated,
            "duration": self.duration_str,
            "runningDuration": self.duration,
            "runningSeconds": self.duration.total_seconds() if self.duration is not None else None,
        })
        # TODO: available fields not yet employed (https://github.com/crim-ca/weaver/issues/129)
        job_status.update({
            "nextPoll": None,
            "expirationDate": None,
            "estimatedCompletion": None,
        })
        job_status.update({
            "percentCompleted": self.progress,
            # new name as per OGC-API, enforced integer
            # https://schemas.opengis.net/ogcapi/processes/part1/1.0/openapi/schemas/statusInfo.yaml
            "progress": int(self.progress),
            "links": self.links(settings, self_link="status"),
        })
        job_status.update(**kwargs)
        return sd.JobStatusInfo().deserialize(job_status)



[docs]
    def params(self):
        # type: () -> AnyParams
        """
        Obtains the mapping of every stored :term:`Job` field to its current value.
        """
        # each entry is both the resulting key and the attribute it is read from
        field_names = (
            "id",
            "task_id",
            "wps_id",
            "wps_url",
            "service",
            "process",
            "title",
            "inputs",
            "outputs",
            "user_id",
            "status",
            "status_message",
            "status_location",
            "execution_response",
            "execution_return",
            "execution_mode",
            "execution_wait",
            "is_workflow",
            "created",
            "started",
            "finished",
            "updated",
            "progress",
            "results",
            "statistics",
            "exceptions",
            "logs",
            "tags",
            "access",
            "context",
            "request",
            "response",
            "subscribers",
            "accept_type",
            "accept_language",
            "accept_profile",
        )
        return {name: getattr(self, name) for name in field_names}





[docs]
class AuthenticationTypes(enum.Enum):
    """
    Kinds of authentication definitions, used as ``type`` by the specialized authentication classes.
    """

[docs]
    # type reported by 'DockerAuthentication'
    DOCKER = "docker"


[docs]
    # type reported by 'VaultFile'
    VAULT = "vault"





[docs]
class Authentication(Base):
    """
    Authentication details to store details required for process operations.
    """

    def __init__(self, auth_scheme, auth_token=None, auth_username=None, auth_password=None, auth_link=None, **kwargs):
        # type: (str, Optional[str], Optional[str], Optional[str], Optional[str], **Any) -> None
        """
        Initialize the authentication from either a token or a username/password pair.

        :param auth_scheme: Authentication scheme. Replaced by the resolved scheme when credentials are used.
        :param auth_token: Authentication token. Cannot be combined with a username or password.
        :param auth_username: Username to generate the token when no token is provided.
        :param auth_password: Password to generate the token when no token is provided.
        :param auth_link: Reference link the authentication applies to, stored only if provided.
        :param kwargs: Additional fields forwarded to the parent initialization.
        :raises ValueError: If a token is provided along with a username or a password.
        """
        super(Authentication, self).__init__(**kwargs)
        # ensure values are provided and of valid format
        if auth_token:
            if auth_username or auth_password:
                raise ValueError(
                    "Cannot initialize Authentication method with token and username/password credentials simultaneously."
                )
        elif auth_username and auth_password:
            # only the scheme and token resolved from the credentials are retained
            resolved = self.from_credentials(auth_username, auth_password, auth_link=auth_link, **kwargs)
            auth_scheme = resolved.scheme
            auth_token = resolved.token
        self.scheme = auth_scheme
        if auth_link:
            self.link = auth_link
        self.token = auth_token or ""
        self.setdefault("id", uuid.uuid4())

    @property
    @abc.abstractmethod

[docs]
    def type(self):
        # type: () -> AuthenticationTypes
        """
        Type of authentication, which must be provided by the specialized classes.
        """
        raise NotImplementedError()


    @property

[docs]
    def id(self):
        # type: () -> uuid.UUID
        """
        Identifier of the authentication, converted to :class:`uuid.UUID` if it was stored as string.
        """
        stored_id = dict.__getitem__(self, "id")
        return uuid.UUID(stored_id) if isinstance(stored_id, str) else stored_id


    @property

[docs]
    def link(self):
        # type: () -> Optional[str]
        """
        Link stored for the authentication, or ``None`` if it was never set.
        """
        stored_link = dict.get(self, "link")
        return stored_link


    @link.setter
    def link(self, link):
        # type: (str) -> None
        """
        Store the link of the authentication.

        :param link: Link to store.
        :raises TypeError: If the link is not a string.
        """
        if not isinstance(link, str):
            # report the actual attribute name ('link') so the error points at the right field
            raise TypeError(f"Type 'str' is required for '{self.__name__}.link', not '{type(link)}'.")
        self["link"] = link

    @property

[docs]
    def token(self):
        # type: () -> str
        """
        Token stored for the authentication.
        """
        stored_token = dict.__getitem__(self, "token")
        return stored_token


    @token.setter
    def token(self, token):
        # type: (str) -> None
        """
        Store the token of the authentication.

        :raises TypeError: If the token is not a string.
        """
        if isinstance(token, str):
            self["token"] = token
            return
        raise TypeError(f"Type 'str' is required for '{self.__name__}.token', not '{type(token)}'.")

    @property

[docs]
    def scheme(self):
        # type: () -> str
        """
        Scheme stored for the authentication.
        """
        stored_scheme = dict.__getitem__(self, "scheme")
        return stored_scheme


    @scheme.setter
    def scheme(self, scheme):
        # type: (str) -> None
        """
        Store the scheme of the authentication.

        :raises TypeError: If the scheme is not a string.
        """
        if isinstance(scheme, str):
            self["scheme"] = scheme
            return
        raise TypeError(f"Type 'str' is required for '{self.__name__}.scheme', not '{type(scheme)}'.")


[docs]
    def json(self):
        # type: () -> None
        """
        Never expose the authentication details as :term:`JSON`.
        """
        # in case it bubbles up by error, never provide it as JSON
        return None



[docs]
    def params(self):
        # type: () -> AnyParams
        """
        Obtains the mapping of stored authentication fields, with the type reported by its enum value.
        """
        auth_params = dict(
            id=self.id,
            type=self.type.value,
            link=self.link,
            token=self.token,
            scheme=self.scheme,
        )
        return auth_params


    @classmethod

[docs]
    def from_credentials(cls, username, password, **params):
        # type: (str, str, **Any) -> AnyAuthentication
        """
        Obtains the authentication using a ``Basic`` token generated from the username and password.

        :param username: Username to encode in the token.
        :param password: Password to encode in the token.
        :param params: Additional parameters forwarded to :meth:`from_params`.
        """
        credentials = f"{username}:{password}".encode("utf-8")
        # an explicitly requested authentication type takes precedence over the class type
        params.setdefault("auth_type", cls.type)
        params.update(
            auth_scheme="Basic",
            auth_token=base64.b64encode(credentials).decode("utf-8"),
        )
        return cls.from_params(**params)


    @classmethod

[docs]
    def from_params(cls, **params):
        # type: (**Any) -> AnyAuthentication
        """
        Obtains the specialized :class:`Authentication` using loaded parameters from :meth:`params`.

        Every parameter not already prefixed by ``auth_`` is duplicated under its prefixed name.
        Once the instance is created, any field not reported by its :meth:`params` is removed from it.

        :raises TypeError: If the authentication type does not match any known specialized class.
        """
        prefixed = {
            f"auth_{name}": value
            for name, value in list(params.items())
            if not name.startswith("auth_")
        }
        params.update(prefixed)
        auth_type = params.pop("auth_type", None)
        params.pop("type", None)  # remove type that must be enforced by specialized class property
        candidates = [
            auth for auth in (DockerAuthentication, VaultFile)
            if auth_type in (auth.type, auth.type.value)
        ]
        if not candidates:
            raise TypeError(f"Unknown authentication type: {auth_type!s}")
        auth_obj = candidates[0](**params)
        allowed = list(auth_obj.params())
        extras = [key for key in auth_obj if key not in allowed]
        for key in extras:
            del auth_obj[key]
        return auth_obj





[docs]
class DockerAuthentication(Authentication):
    """
    Authentication associated to a :term:`Docker` image to retrieve from a private registry given by the reference link.

    .. seealso::
        :ref:`app_pkg_docker`
    """

[docs]
    # Pattern to parse a Docker image link into its components, exposed as the following named groups:
    #   - 'uri': optional prefix ending with '/', made of 'protocol' and 'registry'
    #   - 'registry': one of 'reg_ipv4', 'reg_ipv6', 'reg_domain' or 'reg_host',
    #     optionally followed by 'reg_port' and 'reg_path'
    #   - 'image': 'image_repo' and 'image_name' separated by '/', optionally followed by ':' and 'label'
    DOCKER_LINK_REGEX = re.compile(r"""
        (?:^(?P<uri>
            # protocol
            (?P<protocol>(?:http)s?:\/\/)?
            # registry
            (?:(?P<registry>
                (?:
                # IPv4
                (?P<reg_ipv4>(?:\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}))
                |
                # IPv6
                (?P<reg_ipv6>(?:\[[a-f0-9:]+\]))
                |
                # domain
                (?P<reg_domain>
                    (?:[a-zA-Z](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?\.)+
                    (?:[a-zA-Z]{2,6}\.?|[a-zA-Z0-9-]{2,}\.?))
                |
                # hostname
                (?P<reg_host>([A-Za-z][A-Za-z0-9\-]*[A-Za-z0-9]))
                )
                # port
                (?P<reg_port>:\d+)?
                # path, but leaving at least one slash out for 'repo/image' part
                # the last '/' is matched in <image_ref> portion
                (?:\/?|[\/?\.](?P<reg_path>\S+(\/[\/?\.]\S)*))
            ))
            # registry is optional and not greedy, default to DockerHub
            \/)?
            # image reference
            (?P<image>
                # force 'repo/image:label'
                # disallow plain 'image:label' since remote dockers are always expected
                (?P<image_repo>[0-9a-z_-]{1,40}
                # nested project/repo parts
                (?:\/?|[\/?\.]\S+(\/[\/?\.]\S))*)
                (?:\/
                (?P<image_name>[0-9a-z_-]{1,40})
                )
                # label can be a literal or a variable, optional for 'latest'
                (?::
                (?P<label>[a-z0-9][a-z0-9._-]{1,38}[a-z0-9]|\${[A-Z][A-Z0-9_]{,38}[A-Z0-9]})
                )?
            )
        $)
    """, re.X)  # extended to ignore whitespaces and comments


[docs]
    # registry domain considered equivalent to an omitted registry when parsing the image link
    DOCKER_REGISTRY_DEFAULT_DOMAIN = "index.docker.io"


[docs]
    # registry value stored when the image link refers to the default registry
    DOCKER_REGISTRY_DEFAULT_URI = f"https://{DOCKER_REGISTRY_DEFAULT_DOMAIN}/v1/"  # DockerHub


[docs]
    # authentication type enforced for this specialized class
    type = AuthenticationTypes.DOCKER


    # NOTE:
    #   Specific parameter names are important for reload from database using 'Authentication.from_params'
    def __init__(self, auth_link, auth_scheme="Basic", auth_token=None, **kwargs):
        # type: (str, str, Optional[str], **Any) -> None
        """
        Initialize the authentication reference for pulling a Docker image from a protected registry.

        :param auth_link: Fully qualified Docker registry image link (``{registry-url}/{image}:{label}``).
        :param auth_scheme: Authentication scheme (Basic, Bearer, etc.) if required.
        :param auth_token: Authentication token to employ, if any.
        :param kwargs:
            Additional parameters including username/password credentials according to specified scheme,
            and other definitions to load contents already parsed from database.
        :raises ValueError: If the link cannot be parsed, or if its registry portion is not a valid URI.
        """
        parsed = self.DOCKER_LINK_REGEX.match(auth_link)
        if not parsed:
            raise ValueError(f"Invalid Docker image link does not conform to expected format: [{auth_link}]")
        parts = parsed.groupdict()
        LOGGER.debug("Parsed Docker image/registry link:\n%s", json.dumps(parts, indent=2))
        image = parts["image"]
        if not image:
            raise ValueError(f"Invalid Docker image reference does not conform to image format: {auth_link}")
        # special case for DockerHub, since it is default, it is often omitted, but could be partially provided
        # swap the domain by the full URI in that case because that's what is expected when doing plain 'docker login'
        registry = parts["reg_domain"]
        is_default_registry = registry in [self.DOCKER_REGISTRY_DEFAULT_DOMAIN, "", None]
        if is_default_registry:
            if not registry:
                LOGGER.debug("No registry specified for Docker image, using default DockerHub registry.")
            # when "URI" fragment was detected but is not a real URI (since 'reg_domain' empty), link is invalid
            # (i.e.: there is no URI repository, so nowhere to send Auth token since not default DockerHub)
            link_uri = parts["uri"]
            if link_uri not in [self.DOCKER_REGISTRY_DEFAULT_URI, "", None]:
                raise ValueError(f"Invalid registry specifier detected but not a valid URI: [{link_uri}]")
            registry = self.DOCKER_REGISTRY_DEFAULT_URI
        elif parts["reg_path"]:
            # otherwise, resolve the possible confusion between nested URI/paths vs nested repository/project
            image = f"{parts['reg_path']}/{image}"
        LOGGER.debug("Resolved Docker image/registry from link: [%s, %s]", registry, image)
        self["image"] = image
        self["registry"] = registry
        super(DockerAuthentication, self).__init__(
            auth_scheme, auth_token=auth_token, auth_link=auth_link, **kwargs
        )

    @property

[docs]
    def credentials(self):
        # type: () -> JSON
        """
        Generates the credentials to submit the login operation based on the authentication token and scheme.

        :return: Registry, username and password for the ``Basic`` scheme with a valid token, nothing otherwise.
        """
        if self.scheme != "Basic":
            return {}
        try:
            username, password = decode_auth(self.token)
        except ValueError:
            # when token is invalid such as wrong encoding or missing ':', error is raised
            return {}
        return {"registry": self.registry, "username": username, "password": password}  # nosec


    @property

[docs]
    def image(self):
        # type: () -> str
        """
        Obtains the image portion of the reference without repository prefix.
        """
        stored_image = dict.__getitem__(self, "image")
        return stored_image


    @property

[docs]
    def registry(self):
        # type: () -> str
        """
        Obtains the registry entry that must be used for ``docker login {registry}``.
        """
        stored_registry = dict.__getitem__(self, "registry")
        return stored_registry


    @property

[docs]
    def reference(self):
        # type: () -> str
        """
        Obtains the full reference required when doing :term:`Docker` operations such as ``docker pull {reference}``.

        The registry prefix is omitted for the default registry, and ``latest`` is applied if the image has no label.
        """
        ref = self.image
        if self.registry != self.DOCKER_REGISTRY_DEFAULT_URI:
            ref = f"{self.registry}/{self.image}"
        return ref if ":" in self.image else f"{ref}:latest"



[docs]
    # alias of the 'reference' property kept under its former name
    docker = reference  # backward compatibility


    @property

[docs]
    def repository(self):
        # type: () -> str
        """
        Obtains the full :term:`Docker` repository reference without any tag.
        """
        repo_and_tag = self.reference.rsplit(":", 1)
        return repo_and_tag[0]


    @property

[docs]
    def tag(self):
        # type: () -> Optional[str]
        """
        Obtain the requested tag from the :term:`Docker` reference.

        :return: Portion of the image following its last ``:``, or ``None`` if the image has none.
        """
        _, separator, label = self.image.rpartition(":")
        return label if separator else None



[docs]
    def params(self):
        # type: () -> AnyParams
        """
        Obtains the parent authentication parameters extended with the image and registry.
        """
        docker_params = super(DockerAuthentication, self).params()
        docker_params["image"] = self.image
        docker_params["registry"] = self.registry
        return docker_params





[docs]
class VaultFile(Authentication):
    """
    Dictionary that contains :term:`Vault` file and its authentication information.
    """


[docs]
    # authentication type enforced for this specialized class
    type = AuthenticationTypes.VAULT


[docs]
    # size given to 'token_hex' to generate the access token when none is provided
    bytes = 32


    def __init__(self, file_name="", file_format=None, file_secret=None, auth_token=None, **kwargs):
        # type: (str, Optional[str], Optional[str], Optional[str], **Any) -> None
        """
        Initialize the :term:`Vault` file definition and its access token.

        :param file_name: Name of the file. Defaults to any ``name`` provided by keyword, or an empty name.
        :param file_format: Media-Type of the file. Takes precedence over any ``format`` provided by keyword.
        :param file_secret: Secret of the file. Takes precedence over any ``secret`` provided by keyword.
        :param auth_token: Access token of the file. A random token is generated if omitted.
        :param kwargs: Other definitions, such as when loading contents already parsed from database.
        """
        # authentication fields are enforced below, ignore any value that could conflict with them
        for key in ["type", "scheme", "link", "token"]:
            kwargs.pop(f"auth_{key}", None)
            kwargs.pop(key, None)
        if file_name:
            # explicit name must be stored like the format and secret, otherwise it is silently lost
            kwargs["name"] = file_name
        else:
            kwargs.setdefault("name", "")
        if file_format:
            kwargs["format"] = file_format
        elif not kwargs.get("format"):
            kwargs.pop("format", None)  # avoid error setting None from reload
        if file_secret:
            kwargs["secret"] = file_secret
        super(VaultFile, self).__init__(
            auth_scheme="token",
            auth_link=None,  # don't care
            auth_token=auth_token or token_hex(VaultFile.bytes),
            **kwargs
        )

    @classmethod

[docs]
    def authorized(cls, file, token):
        # type: (Optional[VaultFile], Optional[str]) -> bool
        """
        Determine whether the file access is authorized.

        This method should be employed to validate access and reduce impact of timing attack analysis.

        :param file: Vault file to validate access for. A placeholder file is employed if undefined.
        :param token: Access token submitted for the file.
        :return: Whether the submitted token matches the token of the file.
        """
        # always compare against some token, even if the file does not exist
        default = VaultFile("")
        access = file.token if file else default.token
        # compare bytes since 'compare_digest' raises 'TypeError' for strings with non-ASCII characters,
        # which an arbitrary submitted token could contain
        return compare_digest(str(access).encode("utf-8"), str(token).encode("utf-8"))



[docs]
    def encrypt(self, file):
        # type: (IO[Union[bytes, str]]) -> BytesIO
        """
        Encrypt file data using a secret to avoid plain text contents during temporary :term:`Vault` storage.

        .. note::
            This is not intended to be a *strong* security countermeasure as contents can still be decrypted at any
            time if provided with the right secret. This is only to slightly obfuscate the contents while it transits
            between storage phases until destruction by the consuming process.

        :param file: File to read entirely from its start. Text contents are encoded as UTF-8.
        :return: Buffer of the encrypted contents.
        """
        file.seek(0)
        contents = file.read()
        if isinstance(contents, str):
            contents = contents.encode("utf-8")
        return BytesIO(Fernet(self.secret).encrypt(contents))



[docs]
    def decrypt(self, file):
        # type: (IO[Union[bytes, str]]) -> BytesIO
        """
        Decrypt file contents using secret.

        :param file: File to read entirely from its start. Text contents are encoded as UTF-8.
        :return: Buffer of the decrypted contents.
        """
        file.seek(0)
        contents = file.read()
        if isinstance(contents, str):
            contents = contents.encode("utf-8")
        return BytesIO(Fernet(self.secret).decrypt(contents))


    @property

[docs]
    def secret(self):
        # type: () -> bytes
        """
        Secret associated to this :term:`Vault` file to hash contents back and forth.

        A new key is generated and stored on first access if no secret was defined.
        """
        key = self.get("secret")
        if key:
            return key
        key = Fernet.generate_key()
        self["secret"] = key
        return key


    @secret.setter
    def secret(self, secret):
        # type: (Union[bytes, str]) -> None
        """
        Store the secret of the file, with a string being converted to its URL-safe base64 bytes.

        :raises ValueError: If the secret is empty or neither bytes nor string.
        """
        if not (secret and isinstance(secret, (bytes, str))):
            raise ValueError(f"Invalid '{self.__name__}.secret' must be bytes or string.")
        key = base64.urlsafe_b64encode(secret.encode()) if isinstance(secret, str) else secret
        self["secret"] = key

    @property

[docs]
    def id(self):
        # type: () -> uuid.UUID
        """
        Vault file UUID to retrieve the details from storage.

        A new UUID is generated and stored on first access if none was defined.
        """
        file_id = self.get("id")
        if not file_id:
            file_id = self["id"] = uuid.uuid4()
        return uuid.UUID(file_id) if isinstance(file_id, str) else file_id


    @property

[docs]
    def name(self):
        # type: () -> str
        """
        Name to retrieve the file.
        """
        stored_name = dict.__getitem__(self, "name")
        return stored_name


    @name.setter
    def name(self, name):
        # type: (str) -> None
        """
        Store the name of the file.

        :raises TypeError: If the name is not a string.
        """
        if isinstance(name, str):
            self["name"] = name
            return
        raise TypeError(f"Type 'str' is required for '{self.__name__}.name'")

    @property

[docs]
    def format(self):
        # type: () -> Optional[str]
        """
        Format Media-Type of the file, or ``None`` if it was never set.
        """
        media_type = dict.get(self, "format")
        return media_type


    @format.setter
    def format(self, media_type):
        # type: (str) -> None
        """
        Store the format Media-Type of the file.

        :raises TypeError: If the Media-Type is not a string.
        """
        if isinstance(media_type, str):
            self["format"] = media_type
            return
        raise TypeError(f"Type 'str' is required for '{self.__name__}.format'")

    @property

[docs]
    def href(self):
        # type: () -> str
        """
        Obtain the vault input reference corresponding to the file.

        This corresponds to the ``href`` value to be provided when submitting an input that should be updated using
        the vault file of specified UUID and using the respective authorization token in ``X-Auth-Vault`` header.
        """
        file_id = str(self.id)
        return f"vault://{file_id}"



[docs]
    def json(self):
        # type: () -> JSON
        """
        Obtains the :term:`JSON` contents describing the file ID, its reference and its access token.
        """
        uploaded = dict(
            file_id=self.id,
            file_href=self.href,
            access_token=self.token,
        )
        return sd.VaultFileUploadedBodySchema().deserialize(uploaded)



[docs]
    def params(self):
        # type: () -> AnyParams
        """
        Obtains the mapping of stored :term:`Vault` file fields, with the type reported by its enum value.
        """
        file_params = dict(
            id=self.id,
            name=self.name,
            format=self.format,
            type=self.type.value,
            token=self.token,
            secret=self.secret,
            scheme=self.scheme,
        )
        return file_params





[docs]
class Process(Base):
    # pylint: disable=C0103,invalid-name
    """
    Dictionary that contains a process definition for db storage.

    It always has ``identifier`` (or ``id`` alias) and a ``package`` definition.
    Parameters can be accessed by key or attribute, and appropriate validators or default values will be applied.
    """

    def __init__(self, *args, **kwargs):
        # type: (*Any, **Any) -> None
        """
        Initialize the process and validate the presence of its mandatory fields.

        :raises TypeError: if neither ``id`` nor ``identifier`` is provided, or if ``package`` is missing.
        """
        super(Process, self).__init__(*args, **kwargs)
        # use both 'id' and 'identifier' to support any call (WPS and recurrent 'id')
        has_id = "id" in self
        if not (has_id or "identifier" in self):
            raise TypeError("'id' OR 'identifier' is required")
        if not has_id:
            # only 'identifier' was provided, move it under 'id'
            self.id = self.pop("identifier")
        if "package" not in self:
            raise TypeError("'package' is required")


[docs]
    def _get_id(self):
        # type: () -> str
        return dict.__getitem__(self, "id")



[docs]
    def _set_id(self, _id):
        # type: (str) -> None
        """
        Store the provided identifier under the ``id`` key.
        """
        self["id"] = _id


    # the same getter/setter pair is exposed under both the 'id' and 'identifier' attribute names
    id = identifier = property(
        _get_id,  # type: ignore
        _set_id,  # type: ignore
        doc="Unique process identifier with optional version number if it corresponds to an older revision.",
    )

    @classmethod

[docs]
    def split_version(cls, process_id):
        # type: (str) -> Tuple[str, Optional[str]]
        """
        Split the tagged version from the :term:`Process` identifier considering any required special handling.

        :returns: Process ID (only) and the version if any was available in tagged reference.
        """
        # note::
        #   Consider 'urn:...' prefix that could cause ':' characters to be present although maybe no version in ID?
        #   Mot currently permitted due to schema validation parsing of ID on deploy, but could become permitted...
        result = process_id.rsplit(":", 1)
        if not len(result) == 2:
            return process_id, None
        p_id, version = result
        return (p_id, version) if all(str.isnumeric(part) for part in version.split(".")) else (process_id, None)


    @property

[docs]
    def latest(self):
        # type: () -> bool
        """
        Checks if this :term:`Process` corresponds to the latest revision.

        :returns: ``True`` when no version can be extracted from the identifier.
        """
        # if ID loaded from DB contains a version, it is not the latest by design
        parts = self.split_version(self.id)
        version = parts[-1]
        return version is None


    @property

[docs]
    def name(self):
        # type: () -> str
        """
        Obtain only the :term:`Process` name portion of the unique identifier.

        The identifier is split from its tagged version only when a version is defined for the process.
        """
        if not self.version:
            return self.id
        proc_name = self.split_version(self.id)[0]
        return proc_name


    @property

[docs]
    def tag(self):
        # type: () -> str
        """
        Full identifier including the version for a unique reference.

        :returns: Process name followed by ``:<version>`` when a version is defined, or only the name otherwise.
        """
        proc_id = self.split_version(self.id)[0]
        # bw-compat, if no version available, no update was applied (single deploy)
        # there is no need to define a tag as only one result can be found
        # on next (if any) update request, this revision will be updated with a default version
        if self.version is not None:
            version = as_version_major_minor_patch(self.version, VersionFormat.STRING)
            return f"{proc_id}:{version}"
        return proc_id


    @property

[docs]
    def title(self):
        # type: () -> str
        """
        Title of the process, using its identifier when no title is stored.
        """
        fallback = self.id
        return self.get("title", fallback)


    @title.setter
    def title(self, title):
        # type: (str) -> None
        """
        Store the provided title under the ``title`` key, without validation.
        """
        self["title"] = title


[docs]
    def _get_desc(self):
        # type: () -> str
        # OGC-API-Processes v1 field representation use 'description'
        # bw-compat with existing processes that defined it as abstract
        return self.get("abstract", "") or self.get("description", "")



[docs]
    def _set_desc(self, description):
        # type: (str) -> None
        """
        Store the provided description under the ``abstract`` key.
        """
        self["abstract"] = description


    # the same getter/setter pair is exposed under both the 'description' and 'abstract' attribute names
    description = abstract = property(
        fget=_get_desc,     # type: ignore
        fset=_set_desc,     # type: ignore
        doc="Process description.",
    )

    @property

[docs]
    def keywords(self):
        # type: () -> List[str]
        """
        Keywords of the process, created as an empty list if missing and always including the process type.
        """
        current = self.setdefault("keywords", [])
        proc_type = self.type
        if proc_type not in current:
            current.append(proc_type)
            self["keywords"] = current
        return dict.__getitem__(self, "keywords")


    @keywords.setter
    def keywords(self, keywords):
        # type: (List[str]) -> None
        """
        Store the keywords validated by the ``KeywordList`` schema, with duplicates removed.

        Since duplicates are removed through a :class:`set`, the original ordering is not necessarily preserved.
        """
        validated = sd.KeywordList().deserialize(keywords)
        unique = set(validated)
        self["keywords"] = list(unique)

    @property

[docs]
    def metadata(self):
        # type: () -> List[Metadata]
        """
        Metadata items of the process, or an empty list when none is stored.
        """
        items = self.get("metadata", [])
        return items


    @metadata.setter
    def metadata(self, metadata):
        # type: (List[Metadata]) -> None
        """
        Store the metadata items as validated by the ``MetadataList`` schema.
        """
        schema = sd.MetadataList()
        self["metadata"] = schema.deserialize(metadata)

    @property

[docs]
    def version(self):
        # type: () -> Optional[str]
        """
        Version of the process, or ``None`` when no version is stored.
        """
        current = self.get("version")
        return current


    @version.setter
    def version(self, version):
        # type: (AnyVersion) -> None
        """
        Store the version validated by the ``Version`` schema.

        Any value that is not already a string is first converted to its string representation.
        """
        if isinstance(version, str):
            version_str = version
        else:
            version_str = as_version_major_minor_patch(version, VersionFormat.STRING)
        self["version"] = sd.Version().deserialize(version_str)

    @property

[docs]
    def inputs(self):
        # type: () -> Optional[List[Dict[str, JSON]]]
        """
        Inputs of the process following backward-compatible conversion of stored parameters.

        According to `OGC-API`, ``maxOccurs`` and ``minOccurs`` representations should be:
            - ``maxOccurs``: ``int`` or ``"unbounded"``
            - ``minOccurs``: ``int``

        And, ``mediaType`` should be in description as:
            - ``mediaType``: ``string``

        .. note::
            Because of pre-registered/deployed/retrieved remote processes, inputs are formatted in-line
            to respect valid OGC-API schema representation and apply any required correction transparently.

        :returns: Stored input definitions updated in place, or ``None`` if no inputs are stored.
        """
        stored = self.get("inputs")
        if stored is None:
            return stored
        for io_def in stored:
            # move any variation of 'mime_type' under the expected 'mediaType' field
            for fmt in get_field(io_def, "formats", search_variations=False, default=[]):
                media_type = get_field(fmt, "mime_type", search_variations=True, pop_found=True)
                if media_type is not null:
                    fmt["mediaType"] = media_type
            # normalize occurrences, with 1 applied for both when they are not provided
            min_occurs = get_field(io_def, "min_occurs", search_variations=True, pop_found=True, default=1)
            max_occurs = get_field(io_def, "max_occurs", search_variations=True, pop_found=True, default=1)
            io_def["minOccurs"] = int(min_occurs)
            if max_occurs != "unbounded":
                io_def["maxOccurs"] = int(max_occurs)
            else:
                io_def["maxOccurs"] = max_occurs
            # move any variation of 'abstract' under the expected 'description' field
            description = get_field(io_def, "abstract", search_variations=True, pop_found=True)
            if description:
                io_def["description"] = description
            # restore schema keys that were replaced for storage
            io_schema = get_field(io_def, "schema", search_variations=False)
            if isinstance(io_schema, dict):
                io_def["schema"] = self._decode(io_schema)
        return stored


    @inputs.setter
    def inputs(self, inputs):
        # type: (List[Dict[str, JSON]]) -> None
        """
        Store the input definitions, which must be provided as a list.

        :raises TypeError: if the provided inputs container is not a list.
        """
        if isinstance(inputs, list):
            self["inputs"] = inputs
            return
        raise TypeError("Inputs container expected as list to normalize process definitions.")

    @property

[docs]
    def outputs(self):
        # type: () -> Optional[List[Dict[str, JSON]]]
        """
        Outputs of the process following backward-compatible conversion of stored parameters.

        According to `OGC-API`, ``mediaType`` should be in description as:
            - ``mediaType``: ``string``

        .. note::
            Because of pre-registered/deployed/retrieved remote processes, outputs are formatted in-line
            to respect valid OGC-API schema representation and apply any required correction transparently.

        :returns: Stored output definitions updated in place, or an empty list if no outputs are stored.
        """
        stored = self.get("outputs", [])
        for io_def in stored:
            # move any variation of 'mime_type' under the expected 'mediaType' field
            for fmt in get_field(io_def, "formats", search_variations=False, default=[]):
                media_type = get_field(fmt, "mime_type", pop_found=True, search_variations=True)
                if media_type is not null:
                    fmt["mediaType"] = media_type
            # move any variation of 'abstract' under the expected 'description' field
            description = get_field(io_def, "abstract", search_variations=True, pop_found=True)
            if description:
                io_def["description"] = description
            # restore schema keys that were replaced for storage
            io_schema = get_field(io_def, "schema", search_variations=False)
            if isinstance(io_schema, dict):
                io_def["schema"] = self._decode(io_schema)
        return stored


    @outputs.setter
    def outputs(self, outputs):
        # type: (List[Dict[str, JSON]]) -> None
        """
        Store the output definitions, which must be provided as a list.

        :raises TypeError: if the provided outputs container is not a list.
        """
        if isinstance(outputs, list):
            self["outputs"] = outputs
            return
        raise TypeError("Outputs container expected as list to normalize process definitions.")

    @property

[docs]
    def jobControlOptions(self):  # noqa: N802
        # type: () -> List[AnyExecuteControlOption]
        """
        Control options that indicate which :term:`Job` execution modes are supported by the :term:`Process`.

        Stored items that are not resolved by ``ExecuteControlOption.get`` are dropped, and the default
        is applied when nothing valid remains. The resolved list is saved back before being returned.

        .. note::
            There are no official mentions about the ordering of ``jobControlOptions``.
            Nevertheless, it is often expected that the first item can be considered the default mode when none is
            requested explicitly (at execution time). With the definition of execution mode through the ``Prefer``
            header, `Weaver` has the option to decide if it wants to honor this header, according to available
            resources and :term:`Job` duration.

            For this reason, ``async`` is placed first by default when nothing was defined during deployment,
            since it is the preferred mode in `Weaver`. If deployment included items though, they are preserved as is.
            This allows to re-deploy a :term:`Process` to a remote non-`Weaver` :term:`ADES` preserving the original
            :term:`Process` definition.

        .. seealso::
            Discussion about expected ordering of ``jobControlOptions``:
            https://github.com/opengeospatial/ogcapi-processes/issues/171#issuecomment-836819528
        """
        # Weaver's default async only, must override explicitly during deploy if sync is needed
        default_options = [ExecuteControlOption.ASYNC]
        stored = self.setdefault("jobControlOptions", default_options)
        # eg: None, bw-compat
        candidates = stored if isinstance(stored, list) else default_options
        options = []
        for item in candidates:
            option = ExecuteControlOption.get(item)
            if option is not None:
                options.append(option)
        if not options:
            options = default_options
        self["jobControlOptions"] = options  # no alpha order important!
        return dict.__getitem__(self, "jobControlOptions")


    @property

[docs]
    def outputTransmission(self):  # noqa: N802
        # type: () -> List[AnyExecuteTransmissionMode]
        """
        Transmission modes supported for the outputs of the :term:`Process`.

        Stored items that are not resolved by ``ExecuteTransmissionMode.get`` are dropped, and all known modes
        are applied when nothing valid remains. The sorted result is saved back before being returned.
        """
        stored = self.setdefault("outputTransmission", ExecuteTransmissionMode.values())
        # eg: None, bw-compat
        candidates = stored if isinstance(stored, list) else [ExecuteTransmissionMode.VALUE]
        modes = []
        for item in candidates:
            mode = ExecuteTransmissionMode.get(item)
            if mode is not None:
                modes.append(mode)
        if not modes:
            modes.extend(ExecuteTransmissionMode.values())
        self["outputTransmission"] = sorted(modes)
        return dict.__getitem__(self, "outputTransmission")


    @property

[docs]
    def processDescriptionURL(self):  # noqa: N802
        # type: () -> Optional[str]
        """
        Value stored under ``processDescriptionURL``, or ``None`` when it is not defined.
        """
        url = self.get("processDescriptionURL")
        return url


    @property

[docs]
    def processEndpointWPS1(self):  # noqa: N802
        # type: () -> Optional[str]
        """
        Value stored under ``processEndpointWPS1``, or ``None`` when it is not defined.
        """
        url = self.get("processEndpointWPS1")
        return url


    @property

[docs]
    def executeEndpoint(self):  # noqa: N802
        # type: () -> Optional[str]
        """
        Value stored under ``executeEndpoint``, or ``None`` when it is not defined.
        """
        url = self.get("executeEndpoint")
        return url


    @property

[docs]
    def owsContext(self):  # noqa: N802
        # type: () -> Optional[JSON]
        """
        Value stored under ``owsContext``, or ``None`` when it is not defined.
        """
        context = self.get("owsContext")
        return context


    # wps, workflow, etc.
    @property

[docs]
    def type(self):
        # type: () -> AnyProcessType
        """
        Type of process amongst :mod:`weaver.processes.types` definitions.

        The ``ProcessType.APPLICATION`` type is reported when no type is stored.
        """
        default_type = ProcessType.APPLICATION
        return self.get("type", default_type)


    @property

[docs]
    def mutable(self):
        # type: () -> bool
        """
        Indicates if a process can be modified.

        Any process with a type other than ``ProcessType.BUILTIN`` is reported as mutable.
        """
        process_type = self.type
        return process_type != ProcessType.BUILTIN


    @property

[docs]
    def deployment_profile(self):
        # type: () -> str
        """
        Obtain the deployment profile URI that corresponds to the process definition.

        The profile is selected, in order, from the package class, the process type or the application
        requirement class found in the package. When none match, the process type is appended to the base URI.
        """
        from weaver.processes.wps_package import get_application_requirement

        base = "http://www.opengis.net/profiles/eoc/"
        package = self.package or {}
        package_class = str(package.get("class", "")).lower()
        requirement = get_application_requirement(package, required=False).get("class")
        process_type = self.type

        if package_class == ProcessType.WORKFLOW:
            return f"{base}workflow"
        if ProcessType.is_wps(process_type) or requirement in [
            CWL_REQUIREMENT_APP_WPS1,
            f"{CWL_NAMESPACE_WEAVER_ID}:{CWL_REQUIREMENT_APP_WPS1}",
        ]:
            return f"{base}wpsApplication"
        if process_type == ProcessType.OGC_API or requirement in [
            CWL_REQUIREMENT_APP_OGC_API,
            f"{CWL_NAMESPACE_WEAVER_ID}:{CWL_REQUIREMENT_APP_OGC_API}",
        ]:
            return f"{base}ogcapiApplication"
        if process_type == ProcessType.APPLICATION or requirement in [
            CWL_REQUIREMENT_APP_DOCKER,
            CWL_REQUIREMENT_APP_DOCKER_GPU,
        ]:
            return f"{base}dockerizedApplication"
        return base + process_type


    @property

[docs]
    def package(self):
        # type: () -> Optional[CWL]
        """
        Package :term:`CWL` definition as :term:`JSON`.

        A stored dictionary is returned with its keys decoded, and any other stored value is returned as is.
        """
        stored = self.get("package")
        if isinstance(stored, dict):
            return self._decode(stored)
        return stored


    @package.setter
    def package(self, pkg):
        # type: (Optional[CWL]) -> None
        """
        Store the package definition.

        A dictionary is stored with its keys decoded, and any other value is stored as is.
        """
        if isinstance(pkg, dict):
            self["package"] = self._decode(pkg)
        else:
            self["package"] = pkg

    @property

[docs]
    def payload(self):
        # type: () -> JSON
        """
        Deployment specification as :term:`JSON`.

        A stored dictionary (or an empty one if missing) is returned with its keys decoded.
        Any other stored value is returned as is.
        """
        stored = self.get("payload", {})
        if isinstance(stored, dict):
            return self._decode(stored)
        return stored


    @payload.setter
    def payload(self, body):
        # type: (JSON) -> None
        """
        Store the deployment specification.

        A dictionary is stored with its keys encoded, and any other value is replaced by an empty dictionary.
        """
        if isinstance(body, dict):
            self["payload"] = self._encode(body)
        else:
            self["payload"] = {}

    # encode(->)/decode(<-) characters that cannot be in a key during save to db

[docs]
    # each pair is (original, substitute): '_encode' replaces index 0 by index 1, '_decode' does the reverse
    _character_codes = [("$", "\uFF04"), (".", "\uFF0E")]


    @staticmethod

[docs]
    def _recursive_replace(pkg, index_from, index_to):
        # type: (JSON, int, int) -> JSON
        new = {}
        for k in pkg:
            # find modified key with replace matches
            c_k = k
            for c in Process._character_codes:
                c_f = c[index_from]
                c_t = c[index_to]
                if c_f in k:
                    c_k = k.replace(c_f, c_t)
            # process recursive sub-items
            if isinstance(pkg[k], dict):
                pkg[k] = Process._recursive_replace(pkg[k], index_from, index_to)
            if isinstance(pkg[k], list):
                for i, pkg_i in enumerate(pkg[k]):
                    if isinstance(pkg_i, dict):
                        pkg[k][i] = Process._recursive_replace(pkg[k][i], index_from, index_to)
            # apply new key to obtained sub-items with replaced keys as needed
            new[c_k] = pkg[k]   # note: cannot use pop when using pkg keys iterator (python 3)
        return new


    @staticmethod

[docs]
    def _encode(obj):
        # type: (Optional[JSON]) -> Optional[JSON]
        if obj is None:
            return None
        return Process._recursive_replace(obj, 0, 1)


    @staticmethod

[docs]
    def _decode(obj):
        # type: (Optional[JSON]) -> Optional[JSON]
        if obj is None:
            return None
        return Process._recursive_replace(obj, 1, 0)


    @property

[docs]
    def estimator(self):
        # type: () -> JSON
        """
        Estimator definition of the process, or an empty dictionary when none (or an empty value) is stored.
        """
        stored = self.get("estimator")
        if stored:
            return stored
        return {}


    @estimator.setter
    def estimator(self, estimator):
        # type: (Optional[JSON]) -> None
        """
        Store the estimator definition, which must be provided as a dictionary.

        :raises ValueError: if the provided estimator is not a dictionary (including ``None``).
        """
        if isinstance(estimator, dict):
            self["estimator"] = estimator
            return
        raise ValueError(
            f"Estimator value '{estimator}' is not valid for '{self.__name__}.estimator'. Must be JSON."
        )

    @property

[docs]
    def visibility(self):
        # type: () -> Visibility
        """
        Visibility of the process, resolved with ``Visibility.PUBLIC`` provided as the default.
        """
        stored = self.get("visibility")
        return Visibility.get(stored, Visibility.PUBLIC)


    @visibility.setter
    def visibility(self, visibility):
        # type: (AnyVisibility) -> None
        """
        Store the visibility of the process after resolving it against the known values.

        :param visibility: Value to be resolved through ``Visibility.get``.
        :raises ValueError: if the resolved value is not one of the known visibility values.
        """
        vis = Visibility.get(visibility)
        if vis not in Visibility:
            values = list(Visibility.values())
            # message previously referred to a 'Status' and enclosed the allowed values within the attribute quotes
            raise ValueError(
                f"Visibility '{visibility}' is not valid for '{self.__name__}.visibility', must be one of {values!s}"
            )
        self["visibility"] = vis

    @property

[docs]
    def auth(self):
        # type: () -> Optional[AnyAuthentication]
        """
        Authentication token required for operations with the process.

        A stored dictionary is converted to an ``Authentication`` instance, which replaces the stored value.

        :returns: Authentication instance, or ``None`` if the stored value is neither an instance nor a dictionary.
        """
        stored = self.get("auth", None)
        if isinstance(stored, Authentication):
            return stored
        if not isinstance(stored, dict):
            return None
        loaded = Authentication.from_params(**stored)
        self["auth"] = loaded  # store for later reference without reprocess
        return loaded


    @auth.setter
    def auth(self, auth):
        # type: (Optional[AnyAuthentication]) -> None
        """
        Store the authentication definition of the process.

        Nothing is modified when ``None`` is provided. A dictionary is converted to an ``Authentication`` instance.

        :raises TypeError: if the value is not an ``Authentication`` instance or a dictionary to create one.
        """
        if auth is None:
            return
        auth_obj = Authentication(**auth) if isinstance(auth, dict) else auth
        if isinstance(auth_obj, Authentication):
            self["auth"] = auth_obj
            return
        name = fully_qualified_name(auth_obj)
        raise TypeError(f"Type 'Authentication' is required for '{self.__name__}.auth', not '{name}'.")


[docs]
    def params(self):
        # type: () -> AnyParams
        """
        Obtain the parameters that represent this process definition.

        Values are read through the corresponding properties. Keys of I/O definitions, ``package`` and ``payload``
        are encoded to replace characters that cannot be in a key during save to db.
        """
        return {
            "identifier": self.identifier,
            "title": self.title,
            "abstract": self.abstract,
            "keywords": self.keywords,
            "metadata": self.metadata,
            "version": self.version,
            "additional_links": self.additional_links,
            # escape potential OpenAPI JSON $ref in 'schema' also used by Mongo BSON
            "inputs": [self._encode(_input) for _input in self.inputs or []],
            "outputs": [self._encode(_output) for _output in self.outputs or []],
            "jobControlOptions": self.jobControlOptions,
            "outputTransmission": self.outputTransmission,
            "processEndpointWPS1": self.processEndpointWPS1,
            "processDescriptionURL": self.processDescriptionURL,
            "executeEndpoint": self.executeEndpoint,
            "owsContext": self.owsContext,
            "type": self.type,
            "package": self._encode(self.package),
            "payload": self._encode(self.payload),
            "visibility": self.visibility,
            # nested authentication is reported by its own parameters, if any
            "auth": self.auth.params() if self.auth else None,
            # empty estimator is reported as undefined
            "estimator": self.estimator or None,
        }


    @property

[docs]
    def params_wps(self):
        # type: () -> AnyParams
        """
        Values applicable to create an instance of :class:`pywps.app.Process`.

        Each reported key corresponds to the attribute of the same name.
        """
        fields = (
            "identifier",
            "title",
            "abstract",
            "keywords",
            "metadata",
            "version",
            "inputs",
            "outputs",
            "package",
            "payload",
        )
        return {field: getattr(self, field) for field in fields}



[docs]
    def dict(self):
        # type: () -> AnyParams
        """
        Obtain the dictionary representation of the process, without its authentication details.
        """
        content = super(Process, self).dict()
        # remove preemptively just in case any deserialize fails to drop it
        content.pop("auth", None)
        return content



[docs]
    def json(self):
        # type: () -> JSON
        """
        Obtains the JSON serializable complete representation of the process.

        The dictionary representation is validated through the ``Process`` schema definition.
        """
        content = self.dict()
        return sd.Process().deserialize(content)



[docs]
    # links are kept under the '_links' key, with the setter writing through 'dict.__setitem__' directly
    _links = property(
        fget=lambda self: self.get("_links", []),
        fset=lambda self, value: dict.__setitem__(self, "_links", value),
        doc="Cache pre-computed links."
    )



[docs]
    def links(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> List[Link]
        """
        Obtains the JSON links section of many response body for the :term:`Process`.

        The computed links are saved through ``_links`` and returned directly by following calls while non-empty.
        Items of ``additional_links`` are appended only if their ``rel`` is not already used by a generated link.

        :param container: object that helps retrieve instance details, namely the host URL.
        :returns: List of link definitions applicable to this process.
        """
        from weaver.database import get_db

        if self._links:  # save re-computation time if already done
            return self._links

        # base references from which every other link is derived
        proc_desc = self.href(container)
        proc_list = proc_desc.rsplit("/", 1)[0]
        jobs_list = proc_desc + sd.jobs_service.path
        proc_exec = f"{proc_desc}/execution"
        proc_self = f"{proc_list}/{self.tag}" if self.version else proc_desc
        links = [
            {"href": proc_self, "rel": "self", "title": "Current process description."},
            {"href": sd.OGC_API_PROC_PROFILE_PROC_DESC_URI, "rel": "profile", "title": "Process response profile."},
            {"href": f"{proc_desc}?f=xml", "rel": "alternate",
             "title": "Alternate process description.", "type": ContentType.APP_XML},
        ]
        # HTML alternate representation is only advertised for a process that resides under a service provider
        if self.service:
            links.append(
                {"href": f"{proc_desc}?f=html", "rel": "alternate",
                 "title": "Alternate process description.", "type": ContentType.TEXT_HTML}
            )
        links.extend([
            {"href": proc_desc, "rel": "process-meta", "title": "Process definition."},
            {"href": proc_exec, "rel": sd.OGC_API_PROC_REL_EXECUTE_URI,
             "title": "Process execution endpoint for job submission."},
            {"href": proc_list, "rel": sd.OGC_API_PROC_REL_PROCESSES_URI,
             "title": "List of registered processes."},
            {"href": jobs_list, "rel": sd.OGC_API_PROC_REL_JOB_LIST_URI,
             "title": "List of job executions corresponding to this process."},
            {"href": proc_list, "rel": "up", "title": "List of processes registered under the service."},
        ])
        if self.version:
            # OGC API - Processes - 'Part 5: Versioning' (unofficial)
            # (see https://github.com/opengeospatial/ogcapi-processes/pull/578)
            proc_tag = f"{proc_list}/{self.tag}"
            proc_hist = f"{proc_list}?detail=false&revisions=true&process={self.id}"
            links.extend([
                {"href": proc_tag, "rel": "working-copy", "title": "Tagged version of this process description."},
                {"href": proc_desc, "rel": "latest-version", "title": "Most recent revision of this process."},
                {"href": proc_hist, "rel": "version-history", "title": "Listing of all revisions of this process."},
            ])
            # NOTE(review): selecting 'prev_ver[-1]' and 'next_ver[0]' assumes versions are returned in
            #   ascending order by the store - confirm against 'find_versions'
            # NOTE(review): 'proc_desc' is built from 'self.id', while the version lookup uses 'self.name';
            #   confirm 'self.id' never carries a version here, otherwise revision links would be tagged twice
            versions = get_db(container).get_store(StoreProcesses).find_versions(self.name, VersionFormat.OBJECT)
            proc_ver = as_version_major_minor_patch(self.version, VersionFormat.OBJECT)
            prev_ver = list(filter(lambda ver: ver < proc_ver, versions))
            next_ver = list(filter(lambda ver: ver > proc_ver, versions))
            if prev_ver:
                proc_prev = f"{proc_desc}:{prev_ver[-1]!s}"
                links.append(
                    {"href": proc_prev, "rel": "predecessor-version", "title": "Previous revision of this process."}
                )
            if next_ver:
                proc_next = f"{proc_desc}:{next_ver[0]!s}"
                links.append(
                    {"href": proc_next, "rel": "successor-version", "title": "Next revision of this process."}
                )
        if self.service:
            api_base_url = proc_list.rsplit("/", 1)[0]
            # NOTE(review): assumes 'processEndpointWPS1' is always defined when 'service' is - confirm
            wps_base_url = self.processEndpointWPS1.split("?")[0]
            wps_get_caps = f"{wps_base_url}?service=WPS&request=GetCapabilities&version=1.0.0"
            wps_links = [
                {"href": api_base_url, "rel": "service", "title": "Provider service description."},
                {"href": api_base_url, "rel": "service-meta", "title": "Provider service definition."},
                {"href": wps_get_caps, "rel": "service-desc", "title": "Remote service description."},
                {"href": self.processEndpointWPS1, "rel": sd.OGC_API_PROC_REL_PROCESS_DESC_URI,
                 "title": "Remote process description."},
            ]
            # apply XML type before the JSON default is applied to all remaining links below
            for link in wps_links:
                link.setdefault("type", ContentType.APP_XML)
            links.extend(wps_links)
        # links that did not define them explicitly are given the default type and language
        for link in links:
            link.setdefault("type", ContentType.APP_JSON)
            link.setdefault("hreflang", AcceptLanguage.EN_CA)
        # add user-provided additional links, no type/hreflang added since we cannot guess them
        known_links = {link.get("rel") for link in links}
        extra_links = self.additional_links
        extra_links = [link for link in extra_links if link.get("rel") not in known_links]
        links.extend(extra_links)
        self._links = links
        return links


    @property

[docs]
    def additional_links(self):
        # type: () -> List[Link]
        """
        User-provided links stored under ``additional_links``, or an empty list when none is stored.
        """
        extra_links = self.get("additional_links", [])
        return extra_links


    @additional_links.setter
    def additional_links(self, links):
        # type: (List[Link]) -> None
        """
        Store the user-provided links after validating that their relations are unique.

        Links are validated by the ``LinkList`` schema, and each ``rel`` is then compared against the relations
        of links generated for the process, as well as against the other provided links.

        :raises ValueError: if a link relation is already taken by a generated link or another provided link.
        """
        links = sd.LinkList().deserialize(links)
        self["additional_links"] = []  # don't flag an existing rel that is about to be overridden as conflicting
        self._links = []  # need recompute
        # relations of generated links only, since additional links were reset above
        all_rel = [link["rel"] for link in self.links()]
        for link in links:
            rel = link["rel"]
            if rel in all_rel:
                raise ValueError(
                    f"Value of '{self.__name__}.additional_links' is not valid. "
                    f"Unique links relations are required but '{rel}' is already taken."
                )
            # remember the relation to also detect duplicates within the provided links
            all_rel.append(rel)
        self["additional_links"] = links
        self._links = []  # need recompute on future call


[docs]
    def href(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        Obtain the reference URL for this :term:`Process`.

        The process path is nested under the provider path when the process resides under a service.

        :param container: object from which the application settings, and therefore the base URL, are retrieved.
        """
        url = get_wps_restapi_base_url(get_settings(container))
        provider = self.service
        if provider:
            url += sd.provider_service.path.format(provider_id=provider)
        return url + sd.process_service.path.format(process_id=self.id)



[docs]
    def offering(self, schema=ProcessSchema.OGC, request=None):
        # type: (ProcessSchemaType, AnyRequestType) -> JSON
        """
        Obtains the :term:`JSON` or :term:`XML` serializable offering/description representation of the :term:`Process`.

        :param schema:
            One of values defined by :class:`sd.ProcessDescriptionSchemaQuery` to select which
            process description representation to generate (see each schema for details).
        :param request: HTTP request that can provide more details on how to describe the process.
        :returns:
            Result of :meth:`xml` for the ``WPS`` schema, or the description validated by the
            ``ProcessDescriptionOLD`` or ``ProcessDescriptionOGC`` schema definition otherwise.

        .. note::
            Property name ``offering`` is employed to differentiate from the string process ``description`` field.
            The result of this JSON representation is still the ``ProcessDescription`` schema.
        """
        if schema == ProcessSchema.WPS:
            return self.xml(request)

        # work on a copy to leave the stored definition untouched by following adjustments
        process = copy.deepcopy(self.dict())
        links = self.links()
        process.update({
            "deploymentProfile": self.deployment_profile,
            "links": links
        })

        # adjust I/O definitions with missing information for both representations
        io_hints = {}
        for io_type in ["inputs", "outputs"]:
            # preserve the original listing, which is needed if I/O must be converted back to lists
            io_hints[io_type] = process[io_type]
            process[io_type] = {
                get_field(io_def, "identifier", search_variations=True): io_def
                for io_def in process[io_type]
            }
            # When OpenAPI schema is not predefined explicitly in deployed I/O definitions, generate them dynamically.
            # This call allow to fill missing details for preexisting (already deployed) processes in database.
            # Another possible case is a deployment providing only CWL definitions, and WPS are inferred from them.
            # In this situation, the lack of WPS I/O altogether requires to generate OAS from I/O merge/conversion.
            # Deployment with OAS should have generated this field already to save time or for more precise definitions.
            for io_def in process[io_type].values():
                if io_type == "outputs":
                    formats = io_def.get("formats", [])
                    if formats:
                        io_def["formats"] = extend_alternate_formats(formats)
                io_schema = get_field(io_def, "schema", search_variations=False)
                if not isinstance(io_schema, dict):
                    io_def["schema"] = json2oas_io(io_def)

        # force selection of schema to avoid ambiguity
        if str(schema or ProcessSchema.OGC).upper() == ProcessSchema.OLD:
            # fields nested under 'process' + I/O as lists
            for io_type in ["inputs", "outputs"]:
                process[io_type] = normalize_ordered_io(process[io_type], io_hints[io_type])
            process.update({"process": dict(process)})
            return sd.ProcessDescriptionOLD(schema_meta_include=True).deserialize(process)
        # process fields directly at root + I/O as mappings
        return sd.ProcessDescriptionOGC(schema_meta_include=True).deserialize(process)



[docs]
    def summary(self, revision=False, links=True, container=None):
        # type: (bool, bool, Optional[AnySettingsContainer]) -> JSON
        """
        Obtains the JSON serializable summary representation of the process.

        :param revision: Replace the process identifier by the complete tag representation.
        :param links: Include process links in summary.
        :param container: Application settings or database container to retrieve links and avoid reconnections.
        :returns: Summary validated through the ``ProcessSummary`` schema definition.
        """
        content = self.dict()
        if revision:
            content["id"] = self.tag
        if links:
            content["links"] = self.links(container=container)
        schema = sd.ProcessSummary()
        return schema.deserialize(content)


    @staticmethod

[docs]
    def from_wps(wps_process, **extra_params):
        # type: (ProcessWPS, **Any) -> Process
        """
        Converts a :mod:`pywps` Process into a :class:`weaver.datatype.Process` using provided parameters.

        :param wps_process: Process instance to convert.
        :param extra_params: Additional fields, which take precedence over the ones obtained from the process.
        """
        assert isinstance(wps_process, ProcessWPS)
        process = wps_process.json
        # without an explicit type, the process identifier is used in its place
        process_type = getattr(wps_process, "type", wps_process.identifier)
        io_inputs = [wps2json_io(i) for i in wps_process.inputs]
        io_outputs = [wps2json_io(o) for o in wps_process.outputs]
        process.update({
            "type": process_type,
            "package": None,
            "reference": None,
            "inputs": io_inputs,
            "outputs": io_outputs,
        })
        process.update(**extra_params)
        return Process(process)


    @staticmethod

[docs]
    def from_ows(process, service, container, **kwargs):
        # type: (ProcessOWS, Service, AnySettingsContainer, **Any) -> Process
        """
        Converts a :mod:`owslib.wps` Process to local storage :class:`weaver.datatype.Process`.

        :param process: Process instance to convert.
        :param service: Service under which the process resides, or nothing for a local process.
        :param container: Object from which the local WPS and API URLs are retrieved.
        :param kwargs: Additional fields of the process, except the enforced ones which are always overridden.
        """
        assert isinstance(process, ProcessOWS)
        wps_xml_url = get_wps_url(container)
        wps_api_url = get_wps_restapi_base_url(container)
        svc_name = None
        if not service or wps_api_url == service.url:
            # local weaver process, using WPS-XML endpoint
            remote_service_url = wps_xml_url
            local_provider_url = wps_api_url
            svc_provider_name = "Weaver"
        else:
            svc_name = service.get("name")  # can be a custom ID or identical to provider name
            remote_service_url = service.url
            local_provider_url = f"{wps_api_url}/providers/{svc_name}"
            svc_provider_name = service.wps(container).provider.name
        describe_process_url = f"{local_provider_url}/processes/{process.identifier}"
        execute_process_url = f"{describe_process_url}/jobs"
        package, info = ows2json(process, svc_name, remote_service_url, svc_provider_name)
        wps_query = f"service=WPS&request=DescribeProcess&version=1.0.0&identifier={process.identifier}"
        wps_description_url = f"{remote_service_url}?{wps_query}"
        kwargs.update({  # parameters that must be enforced to find service
            "url": describe_process_url,
            "executeEndpoint": execute_process_url,
            "processEndpointWPS1": wps_description_url,
            "processDescriptionURL": describe_process_url,
            "type": ProcessType.WPS_REMOTE,
            "package": package,
            "service": svc_name
        })
        # NOTE(review): a key defined in both 'info' and 'kwargs' raises 'TypeError' (duplicate keyword argument)
        #   presumably 'ows2json' never reports any of the enforced fields - confirm
        return Process(**info, **kwargs)


    @property

[docs]
    def service(self):
        # type: () -> Optional[str]
        """
        Name of the service provider that owns this process, or ``None`` when no service is defined.

        .. seealso::
            - :meth:`Service.processes`
            - :meth:`Process.convert`
        """
        return self.get("service")


    @service.setter
    def service(self, service):
        # type: (Optional[str]) -> None
        # only a string name or an explicit 'None' (no parent service) are accepted
        if service is not None and not isinstance(service, str):
            raise TypeError(f"Type 'str' is required for '{self.__name__}.service'")
        self["service"] = service

    @staticmethod

[docs]
    def convert(process, service=None, container=None, **kwargs):
        # type: (AnyProcess, Optional[Service], Optional[AnySettingsContainer], **Any) -> Process
        """
        Resolves the provided process definition into the :class:`Process` datatype employed by Weaver.

        :param process: Process definition from :mod:`owslib.wps`, :mod:`pywps`, a mapping or a :class:`Process`.
        :param service: Service providing the process, only employed for :mod:`owslib.wps` definitions.
        :param container: Settings or database container, only employed for :mod:`owslib.wps` definitions.
        :param kwargs: Additional process fields forwarded to the selected conversion.
        :raises TypeError: When the process definition type is not supported.
        """
        # NOTE(review):
        #   Checks are order-dependent. If 'Process' derives from 'dict' (class definition not visible here),
        #   the 'dict' check handles 'Process' instances before the last check is reached - confirm this is intended.
        if isinstance(process, ProcessOWS):
            converted = Process.from_ows(process, service, container, **kwargs)
        elif isinstance(process, ProcessWPS):
            converted = Process.from_wps(process, **kwargs)
        elif isinstance(process, dict):
            converted = Process(process, **kwargs)
        elif isinstance(process, Process):
            converted = process
        else:
            raise TypeError(f"Unknown process type to convert: [{fully_qualified_name(process)}]")
        return converted



[docs]
    def xml(self, request):
        # type: (AnyRequestType) -> str
        """
        Generates the :term:`XML` description of the :term:`Process` according to the :term:`WPS` schema.

        :param request: Request providing the accepted language, also forwarded to the :term:`WPS` conversion.
        :returns: First item of the response document produced by the :mod:`pywps` describe response.
        """
        # make sure 'accept_mimetypes' can be found if missing from the provided request implementation
        extended_request = extend_instance(request, WerkzeugRequest)  # type: Union[AnyRequestType, WerkzeugRequest]
        describe_request = WPSRequest()
        describe_request.language = extended_request.accept_language.header_value or AcceptLanguage.EN_CA
        # set instead of init param to bypass extra setup arguments
        describe_request.http_request = extended_request
        wps_processes = {self.id: self.wps(request)}
        response = DescribeResponse(
            describe_request,
            uuid=None,
            processes=wps_processes,
            identifiers=list(wps_processes),
        )
        xml_doc, _ = response.get_response_doc()
        return xml_doc



[docs]
    def wps(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> ProcessWPS
        """
        Creates the :mod:`pywps` process implementation corresponding to this :class:`Process`.

        :param container: Application settings or database container employed to resolve the settings.
        :raises ProcessInstanceError: When no implementation is mapped for the process type or identifier.
        """
        # import here to avoid circular import errors
        from weaver.processes.wps_default import HelloWPS
        from weaver.processes.wps_package import WpsPackage
        from weaver.processes.wps_testing import WpsTestProcess

        implementations = {
            HelloWPS.identifier: HelloWPS,
            ProcessType.TEST: WpsTestProcess,
        }
        package_types = [
            ProcessType.APPLICATION,    # single CWL package
            ProcessType.BUILTIN,        # local scripts
            ProcessType.WPS_REMOTE,     # remote WPS
            ProcessType.WORKFLOW,       # chaining of CWL packages
        ]
        for package_type in package_types:
            implementations[package_type] = WpsPackage

        # local WPS processes are mapped by identifier rather than by type
        lookup = self.identifier if self.type == ProcessType.WPS_LOCAL else self.type
        if lookup not in implementations:
            raise ProcessInstanceError(f"Unknown process '{lookup}' in mapping.")
        settings = get_settings(container)
        implementation = implementations[lookup]
        return implementation(**self.params_wps, settings=settings)





[docs]
class PriceMixin(Base, abc.ABC):
    """
    Mixin that provides validated ``amount``, ``currency`` and combined ``price`` properties.

    Values are stored under the ``amount`` and ``currency`` keys of the underlying mapping.
    """

    @property
    def amount(self):
        # type: () -> Decimal
        """
        Amount of the current quote.

        Defaults to zero when no amount is stored.
        """
        return Decimal(str(self.get("amount", "0.0")))

    @amount.setter
    def amount(self, amount):
        # type: (Union[Decimal, float, str]) -> None
        if not isinstance(amount, Decimal):
            # 'Decimal' signals an invalid literal with 'InvalidOperation' (parent of 'ConversionSyntax'),
            # therefore catching only 'ConversionSyntax' would let the conversion error escape unhandled
            from decimal import InvalidOperation

            try:
                amount = Decimal(str(amount))
            except (InvalidOperation, ValueError, TypeError) as exc:
                raise ValueError(f"Field '{self.__name__}.amount' must be a floating point number.") from exc
        self["amount"] = amount

    @property
    def currency(self):
        # type: () -> str
        """
        Currency of the quote price.

        Defaults to ``USD`` when no currency is stored.
        """
        currency = self.get("currency")
        return currency or "USD"

    @currency.setter
    def currency(self, currency):
        # type: (str) -> None
        # full match to reject any extra character, including a trailing newline that '$' would tolerate
        if not isinstance(currency, str) or not re.fullmatch(r"[A-Z]{3}", currency):
            raise ValueError(f"Field '{self.__name__}.currency' must be an ISO-4217 currency string code.")
        self["currency"] = currency

    @property
    def price(self):
        # type: () -> Price
        """
        Combined amount and currency of the price.
        """
        return {"amount": self.amount, "currency": self.currency}

    @price.setter
    def price(self, price):
        # type: (Price) -> None
        # each field is validated by its respective property setter
        self.amount = price["amount"]
        self.currency = price["currency"]




[docs]
class Quote(PriceMixin, Base):
    """
    Dictionary that contains quote information.

    It always has ``id`` and ``process`` keys.
    """

    # pylint: disable=C0103,invalid-name

    def __init__(self, *args, **kwargs):
        # type: (*Any, **Any) -> None
        """
        Initialize the quote.

        Missing ``status``, ``created``, ``expire`` (one day from now) and ``id`` fields are set to defaults.

        .. note::
            Although many parameters are required to render the final quote, they are not enforced
            at creation since the partial quote definition is needed before it can be processed.
        """
        super().__init__(*args, **kwargs)
        # set defaults
        if "status" not in self:
            self["status"] = QuoteStatus.SUBMITTED
        if "created" not in self:
            self["created"] = now()
        if "expire" not in self:
            self["expire"] = now() + timedelta(days=1)
        if "id" not in self:
            self["id"] = uuid.uuid4()

    # NOTE:
    #   Assume that a quote payment would be submitted and validated by an external operation.
    #   Do not allow it within the scope of this object to avoid incorrect handling/reporting.
    #   Only allow it when creating the object, which would be loaded from the database with
    #   external payment applied beforehand if provided.

    def __setitem__(self, key, value):
        if key == "paid":
            warnings.warn("Quote payment immutable.", UnsupportedOperationWarning)
            return
        super().__setitem__(key, value)

    def __setattr__(self, key, value):
        if key == "paid":
            warnings.warn("Quote payment immutable.", UnsupportedOperationWarning)
            return
        super().__setattr__(key, value)

    def setdefault(self, key, default=None):  # noqa
        """
        Sets the default value of a missing key, except for the immutable ``paid`` field.

        :returns: Value stored under the key, or ``None`` when the ``paid`` field update was refused.
        """
        if key == "paid":
            warnings.warn("Quote payment immutable.", UnsupportedOperationWarning)
            return None
        # propagate the resulting value as expected from the mapping interface
        return super().setdefault(key, default)

    def update(self, mapping, **__):
        """
        Updates the quote with the provided items, except for the immutable ``paid`` field.

        :param mapping: Mapping or iterable of key-value pairs to apply.
        """
        # filter a merged copy to leave the caller's mapping intact and to cover keyword items as well
        items = dict(mapping, **__)
        if items.pop("paid", None) is not None:
            warnings.warn("Quote payment immutable.", UnsupportedOperationWarning)
        super().update(items)

    @property
    def paid(self):
        # type: () -> bool
        """
        Payment status of the quote, considered unpaid if not defined.
        """
        return self.get("paid", False)

    @paid.setter
    def paid(self, _):
        warnings.warn("Quote payment immutable.", UnsupportedOperationWarning)

    @property
    def id(self):
        # type: () -> uuid.UUID
        """
        Quote ID.
        """
        return dict.__getitem__(self, "id")

    @property
    def detail(self):
        # type: () -> Optional[str]
        """
        Detail message of the quote, if any.
        """
        return self.get("detail")

    @detail.setter
    def detail(self, detail):
        # type: (str) -> None
        # an already defined detail is preserved when 'None' is provided
        # NOTE(review): 'None' without any detail defined raises 'TypeError' below - confirm this is intended
        if detail is None and self.detail is not None:
            return
        if not isinstance(detail, str):
            raise TypeError(f"String required for '{self.__name__}.detail'.")
        self["detail"] = detail

    @property
    def status(self):
        # type: () -> QuoteStatus
        """
        Status of the quote, considered submitted if not resolved.
        """
        return QuoteStatus.get(self.get("status"), QuoteStatus.SUBMITTED)

    @status.setter
    def status(self, status):
        # type: (AnyQuoteStatus) -> None
        value = QuoteStatus.get(status)
        if value not in QuoteStatus:
            statuses = list(QuoteStatus.values())
            name = self.__name__
            raise ValueError(f"Status '{status}' is not valid for '{name}.status', must be one of {statuses!s}'")
        prev = self.status
        # refused transitions are logged and ignored rather than raised
        if (
            (value == QuoteStatus.SUBMITTED and prev != QuoteStatus.SUBMITTED) or
            (value == QuoteStatus.PROCESSING and prev == QuoteStatus.COMPLETED)
        ):
            # report the transition as 'current => requested'
            LOGGER.error("Cannot revert to previous quote status (%s => %s)", prev, value)
            LOGGER.debug(traceback.extract_stack())
            return
        self["status"] = value

    @property
    def user(self):
        # type: () -> Optional[Union[str, int]]
        """
        User ID requesting the quote.

        :raises KeyError: When the user field is not defined.
        """
        return dict.__getitem__(self, "user")

    @user.setter
    def user(self, user):
        # type: (Optional[Union[str, int]]) -> None
        if not isinstance(user, (str, int, type(None))):
            raise ValueError(f"Field '{self.__name__}.user' must be a string, integer or None.")
        self["user"] = user

    @property
    def process(self):
        # type: () -> str
        """
        Process ID.

        :raises KeyError: When the process field is not defined.
        """
        return dict.__getitem__(self, "process")

    @process.setter
    def process(self, process):
        # type: (AnyProcessRef) -> None
        if isinstance(process, Process):
            process = process.tag
        if not isinstance(process, str) or not process:
            raise ValueError(f"Field '{self.__name__}.process' must be a string.")
        self["process"] = process

    @property
    def seconds(self):
        # type: () -> int
        """
        Estimated time of the process execution in seconds.
        """
        return self.get("seconds") or 0

    @seconds.setter
    def seconds(self, seconds):
        # type: (int) -> None
        if not isinstance(seconds, int):
            raise TypeError(f"Invalid estimated duration type for '{self.__name__}.seconds'.")
        if seconds < 0:
            raise ValueError(f"Invalid estimated duration value for '{self.__name__}.seconds'.")
        self["seconds"] = seconds

    @property
    def duration(self):
        # type: () -> timedelta
        """
        Duration as delta time that can be converted to ISO-8601 format (``P[n]Y[n]M[n]DT[n]H[n]M[n]S``).
        """
        return timedelta(seconds=self.seconds)

    @property
    def duration_str(self):
        # type: () -> str
        """
        Human-readable duration formatted as ``hh:mm:ss``.

        Fractional seconds are dropped and the result is zero-padded to 8 characters.
        """
        duration = self.duration
        if duration is None:
            return "00:00:00"
        return str(duration).split(".", 1)[0].zfill(8)

    @property
    def parameters(self):
        # type: () -> QuoteProcessParameters
        """
        Process execution parameters for quote.

        This should include minimally the inputs and expected outputs,
        but could be extended as needed with relevant details for quoting algorithm.

        .. note::
            Accessing this property removes the legacy ``processParameters`` field, and transfers
            its contents to ``parameters`` if the latter is not already defined.
        """
        params = dict.pop(self, "processParameters", None)  # backward compatibility
        if params and "parameters" not in self:
            self.parameters = params
        params = self.get("parameters", {})
        return params

    @parameters.setter
    def parameters(self, data):
        # type: (QuoteProcessParameters) -> None
        try:
            sd.QuoteProcessParameters().deserialize(data)
        except colander.Invalid as exc:
            LOGGER.error("Invalid process parameters for quote submission.\n%s", repr_json(data, indent=2))
            raise TypeError("Invalid process parameters for quote submission.") from exc
        # data is stored as provided, the schema is only employed for validation
        self["parameters"] = data

    processParameters = inputs = parameters  # noqa  # backward compatible alias

    @property
    def results(self):
        # type: () -> QuoteProcessResults
        """
        Process execution results following quote estimation.
        """
        return self.get("results") or {}

    @results.setter
    def results(self, data):
        # type: (QuoteProcessResults) -> None
        try:
            results = sd.QuoteProcessResults().deserialize(data)
        except colander.Invalid as exc:
            LOGGER.error("Invalid process results for quote submission.\n%s", repr_json(data, indent=2))
            raise TypeError("Invalid process results for quote submission.") from exc
        self["results"] = results

    @property
    def outputs(self):
        # type: () -> QuoteStepOutputParameters
        """
        Quote estimation outputs for a following step quote estimation.
        """
        return self.get("outputs") or {}

    @outputs.setter
    def outputs(self, data):
        # type: (QuoteStepOutputParameters) -> None
        try:
            outputs = sd.QuoteStepOutputParameters().deserialize(data)
        except colander.Invalid as exc:
            LOGGER.error("Invalid quote estimation outputs for next step submission.\n%s", repr_json(data, indent=2))
            raise TypeError("Invalid quote estimation outputs for next step submission.") from exc
        self["outputs"] = outputs

    expire = LocalizedDateTimeProperty(doc="Quote expiration datetime.")

    created = LocalizedDateTimeProperty(doc="Quote creation datetime.", default_now=True)

    @property
    def steps(self):
        # type: () -> List[uuid.UUID]
        """
        Sub-quote IDs if applicable.
        """
        return self.get("steps", [])

    def params(self):
        # type: () -> AnyParams
        """
        Obtains the quote fields resolved through their respective properties.
        """
        return {
            "id": self.id,
            "detail": self.detail,
            "status": self.status,
            "paid": self.paid,
            "amount": str(self.amount),  # preserve precision with representation as is
            "currency": self.currency,
            "user": self.user,
            "process": self.process,
            "steps": self.steps,
            "created": self.created,
            "expire": self.expire,
            "seconds": self.seconds,
            "results": self.results,
            "outputs": self.outputs,
            "parameters": self.parameters,
        }

    def partial(self):
        # type: () -> JSON
        """
        Submitted :term:`Quote` representation with minimal details until evaluation is completed.
        """
        data = {
            "status": self.status,
            "quoteID": self.id,
            "processID": self.process
        }
        return sd.PartialQuoteSchema().deserialize(data)

    def json(self):
        # type: () -> JSON
        """
        Step :term:`Quote` with :term:`JSON` representation.

        .. note::
            Does not include derived :term:`Quote` details if the associated :term:`Process` is a :term:`Workflow`.
        """
        data = self.dict()
        data.update(self.partial())
        data.update({
            "userID": self.user,
            "estimatedTime": self.duration_str,
            "estimatedSeconds": self.seconds,
            "estimatedDuration": self.duration,
            "processParameters": self.parameters,
        })
        return sd.Quotation().deserialize(data)

    def links(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> List[Link]
        """
        Obtains the links to the quote details, its process description and the quoted process execution.
        """
        quote_url = self.href(container)
        # strip the quotes listing path to recover the base location shared by the other endpoints
        base_href = quote_url.rsplit(sd.quotes_service.path, 1)[0]
        proc_href = base_href + sd.process_service.path.format(process_id=self.process)
        exec_href = base_href + sd.process_quote_service.path.format(process_id=self.process, quote_id=self.id)
        links = [
            {"href": quote_url, "rel": "self", "title": "Quote details."},
            {"href": proc_href, "rel": "process-meta", "title": "Process description."},
            {"href": exec_href, "rel": "quotation", "title": "Process execution using quote submission."},
        ]
        return links

    def href(self, container=None):
        # type: (Optional[AnySettingsContainer]) -> str
        """
        Obtain the reference URL for this :term:`Quote`.
        """
        settings = get_settings(container)
        base_url = get_wps_restapi_base_url(settings)
        quote_url = base_url + sd.quote_service.path.format(quote_id=self.id)
        return quote_url





[docs]
class Bill(PriceMixin, Base):
    """
    Dictionary that contains bill information.

    It always has ``id``, ``user``, ``quote`` and ``job`` keys.
    """

    def __init__(self, *args, **kwargs):
        """
        Initialize the bill and validate its required fields.

        The ``created`` field defaults to the current time and is stored as ISO-8601 string.
        The ``id`` field defaults to a newly generated UUID.

        :raises TypeError: When a required field is missing.
        :raises ValueError: When a field value is not of the expected type or format.
        """
        super().__init__(*args, **kwargs)
        for field in ("quote", "job", "user"):
            if field not in self:
                raise TypeError(f"Field 'Bill.{field}' is required")
            if not isinstance(self.get(field), str):
                raise ValueError(f"Field 'Bill.{field}' must be a string.")
        if "price" not in self:
            raise TypeError("Field 'Bill.price' is required")
        if not isinstance(self.get("price"), float):
            raise ValueError("Field 'Bill.price' must be a float number.")
        if "currency" not in self:
            raise TypeError("Field 'Bill.currency' is required")
        if not isinstance(self.get("currency"), str) or len(self.get("currency")) != 3:
            raise ValueError("Field 'Bill.currency' must be an ISO-4217 currency string code.")
        if "created" not in self:
            self["created"] = now()
        try:
            self["created"] = dt_parse(str(self.get("created"))).isoformat()
        except ValueError as exc:
            raise ValueError("Field 'Bill.created' must be an ISO-8601 datetime string.") from exc
        if "id" not in self:
            self["id"] = uuid.uuid4()

    @property
    def id(self):
        """
        Bill ID.
        """
        return dict.__getitem__(self, "id")

    @property
    def user(self):
        """
        User ID.
        """
        return dict.__getitem__(self, "user")

    @property
    def quote(self):
        """
        Quote ID.
        """
        return dict.__getitem__(self, "quote")

    @property
    def job(self):
        """
        Job ID.
        """
        return dict.__getitem__(self, "job")

    @property
    def created(self):
        """
        Bill creation datetime.
        """
        return self.get("created")

    @property
    def title(self):
        """
        Bill title.
        """
        return self.get("title")

    @property
    def description(self):
        """
        Bill description.
        """
        return self.get("description")

    def params(self):
        # type: () -> AnyParams
        """
        Obtains the bill fields resolved through their respective properties.
        """
        return {
            "id": self.id,
            "user": self.user,
            "quote": self.quote,
            "job": self.job,
            "price": self.price,
            "created": self.created,
            "title": self.title,
            "description": self.description,
        }

    def json(self):
        # type: () -> JSON
        """
        Obtains the :term:`JSON` representation of the bill validated against the bill schema.

        The bill, quote and job identifiers are provided as ``billID``, ``quoteID`` and ``jobID``.
        """
        data = self.dict()
        data.update({
            "billID": self.id,
            "quoteID": self.quote,
            "jobID": self.job,
        })
        # deserialize the data extended with the identifier fields rather than the raw bill contents
        return sd.BillSchema().deserialize(data)