Source code for mlrun.serving.remote

# Copyright 2023 Iguazio
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import asyncio
import json
from copy import copy
from typing import Union

import aiohttp
import requests
import storey
from storey.flow import _ConcurrentJobExecution

import mlrun
import mlrun.common.schemas
import mlrun.config
import mlrun.platforms
import mlrun.utils.async_http
from mlrun.common.helpers import parse_versioned_object_uri
from mlrun.errors import err_to_str
from mlrun.utils import dict_to_json, logger

from ..config import config
from .utils import (
    _extract_input_data,
    _update_result_body,
    event_id_key,
    event_path_key,
)

default_retries = 6
default_backoff_factor = 1



[docs]
class RemoteStep(storey.SendToHttp):
    def __init__(
        self,
        url: str,
        subpath: str | None = None,
        method: str | None = None,
        headers: dict | None = None,
        url_expression: str | None = None,
        body_expression: str | None = None,
        return_json: bool = True,
        input_path: str | None = None,
        result_path: str | None = None,
        max_in_flight=None,
        retries=None,
        backoff_factor=None,
        timeout=None,
        headers_expression: str | None = None,
        **kwargs,
    ):
        """class for calling remote endpoints

        sync and async graph step implementation for request/resp to remote service (class shortcut = "$remote")
        url can be an http(s) url (e.g. `https://myservice/path`) or an mlrun function uri ([project/]name).
        alternatively the url_expression can be specified to build the url from the event (e.g. "event['url']").

        example pipeline::

            flow = function.set_topology("flow", engine="async")
            flow.to(name="step1", handler="func1")
                .to(RemoteStep(name="remote_echo", url="https://myservice/path", method="POST"))
                .to(name="laststep", handler="func2").respond()


        :param url:     http(s) url or function [project/]name to call
        :param subpath: path (which follows the url), use `$path` to use the event.path
        :param method:  The HTTP method to use for the request (e.g., "GET", "POST", "PUT", "DELETE").
                        If not provided, the step will try to use `event.method` at runtime, and if that
                        is also missing, it defaults to `"POST"`.
        :param headers: dictionary with http header values
        :param url_expression: an expression for getting the url from the event, e.g. "event['url']"
        :param body_expression: an expression for getting the request body from the event, e.g. "event['data']"
        :param return_json: indicate the returned value is json, and convert it to a py object
        :param input_path:  when specified selects the key/path in the event to use as body
                            this require that the event body will behave like a dict, example:
                            event: {"data": {"a": 5, "b": 7}}, input_path="data.b" means request body will be 7
        :param result_path: selects the key/path in the event to write the results to
                            this require that the event body will behave like a dict, example:
                            event: {"x": 5} , result_path="resp" means the returned response will be written
                            to event["y"] resulting in {"x": 5, "resp": <result>}
        :param retries:     number of retries (in exponential backoff)
        :param backoff_factor: A backoff factor in seconds to apply between attempts after the second try
        :param timeout:     How long to wait for the server to send data before giving up, float in seconds
        :param headers_expression: an expression for getting the request headers from the event, e.g. "event['headers']"
        """
        # init retry args for storey
        retries = default_retries if retries is None else retries
        super().__init__(
            None,
            None,
            input_path=input_path,
            result_path=result_path,
            max_in_flight=max_in_flight,
            retries=retries,
            backoff_factor=backoff_factor,
            **kwargs,
        )
        self.url = url
        self.url_expression = url_expression
        self.body_expression = body_expression
        self.headers_expression = headers_expression
        self.headers = headers
        self.method = method
        self.return_json = return_json
        self.subpath = subpath

        self.timeout = timeout

        self._append_event_path = False
        self._endpoint = ""
        self._session = None
        self._url_function_handler = None
        self._body_function_handler = None
        self._headers_function_handler = None


[docs]
    def post_init(self, mode="sync", **kwargs):
        self._endpoint = self.url
        if self.url and self.context:
            self._endpoint = self.context.get_remote_endpoint(self.url).strip("/")
        if self.body_expression:
            # init lambda function for calculating url from event
            self._body_function_handler = eval(
                "lambda event: " + self.body_expression, {"context": self.context}, {}
            )
        if self.url_expression:
            # init lambda function for calculating url from event
            self._url_function_handler = eval(
                "lambda event: " + self.url_expression,
                {"endpoint": self._endpoint, "context": self.context},
                {},
            )
        if self.headers_expression:
            self._headers_function_handler = eval(
                "lambda event: " + self.headers_expression,
                {"context": self.context},
                {},
            )
        elif self.subpath:
            self._append_event_path = self.subpath == "$path"
            if not self._append_event_path:
                self._endpoint = self._endpoint + "/" + self.subpath.lstrip("/")


    async def _process_event(self, event):
        # async implementation (with storey)
        body = self._get_event_or_body(event)
        method, url, headers, body, kwargs = self._generate_request(event, body)
        kwargs = kwargs or {}
        if self.timeout:
            kwargs["timeout"] = aiohttp.ClientTimeout(total=self.timeout)
        try:
            resp = await self._client_session.request(
                method, url, headers=headers, data=body, ssl=False, **kwargs
            )
            if resp.status >= 500:
                text = await resp.text()
                raise RuntimeError(f"bad http response {resp.status}: {text}")
            return resp
        except TimeoutError as exc:
            logger.error(f"http request to {url} timed out in RemoteStep {self.name}")
            raise exc

    async def _handle_completed(self, event, response):
        response_body = await response.read()
        if response.status >= 400:
            raise ValueError(
                f"For event {event}, RemoteStep {self.name} got an unexpected response "
                f"status {response.status}: {response_body}"
            )

        body = self._get_data(response_body, response.headers)

        new_event = self._user_fn_output_to_event(event, body)
        await self._do_downstream(new_event)


[docs]
    def do_event(self, event):
        # sync implementation (without storey)
        if not self._session:
            self._session = mlrun.utils.HTTPSessionWithRetry(
                self.retries,
                self.backoff_factor or mlrun.mlconf.http_retry_defaults.backoff_factor,
                retry_on_exception=False,
                retry_on_status=self.retries > 0,
                retry_on_post=True,
            )

        body = _extract_input_data(self._input_path, event.body)
        method, url, headers, body, kwargs = self._generate_request(event, body)
        try:
            resp = self._session.request(
                method,
                url,
                verify=mlrun.mlconf.httpdb.http.verify,
                headers=headers,
                data=body,
                timeout=self.timeout,
                **kwargs,
            )
        except requests.exceptions.ReadTimeout as err:
            raise requests.exceptions.ReadTimeout(
                f"http request to {url} timed out in RemoteStep {self.name}, {err_to_str(err)}"
            )
        except OSError as err:
            raise OSError(f"cannot invoke url: {url}, {err_to_str(err)}")
        if not resp.ok:
            raise RuntimeError(f"bad http response {resp.status_code}: {resp.text}")

        result = self._get_data(resp.content, resp.headers)
        event.body = _update_result_body(self._result_path, event.body, result)
        return event


    def _generate_request(self, event, body):
        method = self.method or event.method or "POST"
        if self._headers_function_handler:
            headers = self._headers_function_handler(body)
        else:
            headers = copy(self.headers) or {}

        if self._url_function_handler:
            url = self._url_function_handler(body)
        else:
            url = self._endpoint
            striped_path = event.path.lstrip("/")
            if self._append_event_path:
                url = url + "/" + striped_path
            if striped_path:
                headers[event_path_key] = event.path
        if event.id:
            headers[event_id_key] = event.id
        if method == "GET":
            body = None
        elif body is not None and not isinstance(body, str | bytes):
            if self._body_function_handler:
                body = self._body_function_handler(body)
            body = json.dumps(body)
            headers["Content-Type"] = "application/json"

        return method, url, headers, body, {}

    def _get_data(self, data, headers):
        if (
            self.return_json
            or headers.get("content-type", "").lower() == "application/json"
        ) and isinstance(data, str | bytes):
            data = json.loads(data)
        return data




[docs]
class BatchHttpRequests(_ConcurrentJobExecution):
    def __init__(
        self,
        url: str | None = None,
        subpath: str | None = None,
        method: str | None = None,
        headers: dict | None = None,
        url_expression: str | None = None,
        body_expression: str | None = None,
        return_json: bool = True,
        input_path: str | None = None,
        result_path: str | None = None,
        retries=None,
        backoff_factor=None,
        timeout=None,
        **kwargs,
    ):
        """class for calling remote endpoints in parallel

        sync and async graph step implementation for request/resp to remote service (class shortcut = "$remote")
        url can be an http(s) url (e.g. `https://myservice/path`) or an mlrun function uri ([project/]name).
        alternatively the url_expression can be specified to build the url from the event (e.g. "event['url']").

        example pipeline::

            function = mlrun.new_function("myfunc", kind="serving")
            flow = function.set_topology("flow", engine="async")
            flow.to(
                BatchHttpRequests(
                    url_expression="event['url']",
                    body_expression="event['data']",
                    method="POST",
                    input_path="req",
                    result_path="resp",
                )
            ).respond()

            server = function.to_mock_server()
            # request contains a list of elements, each with url and data
            request = [{"url": f"{base_url}/{i}", "data": i} for i in range(2)]
            resp = server.test(body={"req": request})


        :param url:     http(s) url or function [project/]name to call
        :param subpath: path (which follows the url)
        :param method:  HTTP method (GET, POST, ..), default to POST
        :param headers: dictionary with http header values
        :param url_expression: an expression for getting the url from the event, e.g. "event['url']"
        :param body_expression: an expression for getting the request body from the event, e.g. "event['data']"
        :param return_json: indicate the returned value is json, and convert it to a py object
        :param input_path:  when specified selects the key/path in the event to use as body
                            this require that the event body will behave like a dict, example:
                            event: {"data": {"a": 5, "b": 7}}, input_path="data.b" means request body will be 7
        :param result_path: selects the key/path in the event to write the results to
                            this require that the event body will behave like a dict, example:
                            event: {"x": 5} , result_path="resp" means the returned response will be written
                            to event["y"] resulting in {"x": 5, "resp": <result>}
        :param retries:     number of retries (in exponential backoff)
        :param backoff_factor: A backoff factor in seconds to apply between attempts after the second try
        :param timeout:     How long to wait for the server to send data before giving up, float in seconds
        """
        if url and url_expression:
            raise mlrun.errors.MLRunInvalidArgumentError(
                "cannot set both url and url_expression"
            )
        self.url = url
        self.url_expression = url_expression
        self.body_expression = body_expression
        self.headers = headers
        self.method = method
        self.return_json = return_json
        self.subpath = subpath
        super().__init__(input_path=input_path, result_path=result_path, **kwargs)

        self.timeout = timeout
        self.retries = retries
        self.backoff_factor = backoff_factor
        self._append_event_path = False
        self._endpoint = ""
        self._session = None
        self._url_function_handler = None
        self._body_function_handler = None
        self._request_args = {}

    def _init(self):
        super()._init()
        self._client_session = None

    async def _lazy_init(self):
        connector = aiohttp.TCPConnector()
        self._client_session = aiohttp.ClientSession(connector=connector)

    async def _cleanup(self):
        await self._client_session.close()


[docs]
    def post_init(self, mode="sync", **kwargs):
        self._endpoint = self.url
        if self.url and self.context:
            self._endpoint = self.context.get_remote_endpoint(self.url).strip("/")
        if self.body_expression:
            # init lambda function for calculating url from event
            self._body_function_handler = eval(
                "lambda event: " + self.body_expression, {}, {}
            )
        if self.url_expression:
            # init lambda function for calculating url from event
            self._url_function_handler = eval(
                "lambda event: " + self.url_expression, {}, {"endpoint": self._endpoint}
            )
        elif self.subpath:
            self._endpoint = self._endpoint + "/" + self.subpath.lstrip("/")
        if self.timeout:
            self._request_args["timeout"] = aiohttp.ClientTimeout(total=self.timeout)


    async def _process_event(self, event):
        # async implementation (with storey)
        method = self.method or event.method or "POST"
        headers = self.headers or {}
        input_list = self._get_event_or_body(event)
        is_get = method == "GET"
        is_json = False

        body_list = []
        url_list = []
        for body in input_list:
            if self._url_function_handler:
                url_list.append(self._url_function_handler(body))
            else:
                url_list.append(self._endpoint)

            if is_get:
                body = None
            elif body is not None and not isinstance(body, str | bytes):
                if self._body_function_handler:
                    body = self._body_function_handler(body)
                body = json.dumps(body)
                is_json = True
            body_list.append(body)

        if is_json:
            headers["Content-Type"] = "application/json"

        responses = []
        for url, body in zip(url_list, body_list):
            responses.append(
                asyncio.ensure_future(
                    self._submit_with_retries(method, url, headers, body)
                )
            )
        return await asyncio.gather(*responses)

    async def _process_event_with_retries(self, event):
        return await self._process_event(event)

    async def _submit(self, method, url, headers, body):
        async with self._client_session.request(
            method, url, headers=headers, data=body, ssl=False, **self._request_args
        ) as future:
            if future.status >= 500:
                text = await future.text()
                raise RuntimeError(f"bad http response {future.status}: {text}")
            return await future.read(), future.headers

    async def _submit_with_retries(self, method, url, headers, body):
        times_attempted = 0
        max_attempts = (self.retries or default_retries) + 1
        while True:
            try:
                return await self._submit(method, url, headers, body)
            except Exception as ex:
                times_attempted += 1
                attempts_left = max_attempts - times_attempted
                if self.logger:
                    self.logger.warn(
                        f"{self.name} failed to process event ({attempts_left} retries left): {ex}"
                    )
                if attempts_left <= 0:
                    raise ex
                backoff_factor = (
                    default_backoff_factor
                    if self.backoff_factor is None
                    else self.backoff_factor
                )
                backoff_value = (backoff_factor) * (2 ** (times_attempted - 1))
                backoff_value = min(self._BACKOFF_MAX, backoff_value)
                if backoff_value >= 0:
                    await asyncio.sleep(backoff_value)

    async def _handle_completed(self, event, response):
        data = []
        for body, headers in response:
            data.append(self._get_data(body, headers))

        new_event = self._user_fn_output_to_event(event, data)
        await self._do_downstream(new_event)

    def _get_data(self, data, headers):
        if (
            self.return_json
            or headers.get("content-type", "").lower() == "application/json"
        ) and isinstance(data, str | bytes):
            data = json.loads(data)
        return data




[docs]
class MLRunAPIRemoteStep(RemoteStep):
    def __init__(
        self, method: str, path: str, fill_placeholders: bool | None = None, **kwargs
    ):
        """
        Graph step implementation for calling MLRun API endpoints

        :param method:  The HTTP method to use for the request (e.g., "GET", "POST", "PUT", "DELETE").
                        If not provided, the step will try to use `event.method` at runtime, and if that
                        is also missing, it defaults to `"POST"`.
        :param path:    API path (e.g. /api/projects)
        :param fill_placeholders: if True, fill placeholders in the path using event fields (default to False)
        :param kwargs:  other arguments passed to RemoteStep
        """
        super().__init__(url="", method=method, **kwargs)
        self.rundb = None
        self.path = path
        self.fill_placeholders = fill_placeholders

    def _generate_request(self, event, body):
        method = self.method or event.method or "POST"
        kw = {
            key: value
            for key, value in (
                ("params", body.get("params")),
                ("json", body.get("json")),
            )
            if value is not None
        }

        headers = self.headers or {}
        headers.update(body.get("headers", {}))

        if self.rundb.user:
            kw["auth"] = (self.rundb.user, self.rundb.password)
        elif self.rundb.token_provider:
            token = self.rundb.token_provider.get_token()
            if token:
                # Iguazio auth doesn't support passing token through bearer, so use cookie instead
                if self.rundb.token_provider.is_iguazio_session():
                    session_cookie = f'session=j:{{"sid": "{token}"}}'
                    headers["cookie"] = session_cookie
                else:
                    if mlrun.common.schemas.HeaderNames.authorization not in headers:
                        logger.info(
                            "Adding authorization header with bearer token for MLRun API request"
                        )
                        headers.update(
                            {
                                mlrun.common.schemas.HeaderNames.authorization: (
                                    mlrun.common.schemas.AuthorizationHeaderPrefixes.bearer
                                    + token
                                )
                            }
                        )

        if mlrun.common.schemas.HeaderNames.client_version not in headers:
            headers.update(
                {
                    mlrun.common.schemas.HeaderNames.client_version: self.rundb.client_version,
                    mlrun.common.schemas.HeaderNames.python_version: self.rundb.python_version,
                    "User-Agent": f"{requests.utils.default_user_agent()} mlrun/{config.version}",
                }
            )

        url = self.url.format(**body) if self.fill_placeholders else self.url
        headers["Content-Type"] = "application/json"
        return method, url, headers, dict_to_json(body), kw


[docs]
    def post_init(self, mode="sync", **kwargs):
        super().post_init(mode=mode, **kwargs)
        self.fill_placeholders = self.fill_placeholders or False
        self.rundb = mlrun.get_run_db()
        self.url = self.rundb.get_base_api_url(self.path)





[docs]
class RemoteFunctionStep(RemoteStep):
    """
    Graph step implementation for invoking functions remotely.

    :param fn:  Either an `mlrun.runtimes.RemoteRuntime` object or
                a string URI in the form `function_name` or `project_name/function_name`.
    :param project_name:  Optional project name containing the function. If not provided,
                          the project name will be derived automatically according to the following order:

                          1. Extracted from the function URI (if specified as 'project_name/function_name')
                          2. Taken from the `project_name` parameter
                          3. Inferred from the current runtime or graph execution context
    """

    def __init__(
        self,
        fn: Union[mlrun.runtimes.RemoteRuntime, str, None] = None,
        project_name: str = "",
        **kwargs,
    ):
        super().__init__(url="", **kwargs)
        self.rundb = None
        self.fn = fn
        self.project_name = project_name


[docs]
    def post_init(self, mode="sync", **kwargs) -> None:
        self.rundb = mlrun.get_run_db()
        if not isinstance(self.fn, (mlrun.runtimes.RemoteRuntime, str)):
            raise mlrun.errors.MLRunInvalidArgumentTypeError(
                "Parameter 'fn' must be of type mlrun.runtimes.RemoteRuntime or str."
            )

        if not self.fn:
            raise mlrun.errors.MLRunRuntimeError(
                "Parameter 'fn' have to be initialized."
            )

        if isinstance(self.fn, str):
            project, uri, tag, hash_key = parse_versioned_object_uri(self.fn)

            if self.project_name and project:
                if self.project_name != project:
                    raise mlrun.errors.MLRunRuntimeError(
                        "Project name can only be set once: either in 'project_name' or in the function URI."
                    )

            project = project or self.project_name or mlrun.mlconf.active_project

            try:
                self.fn = self.rundb.get_function(
                    name=uri, project=project, tag=tag, hash_key=hash_key
                )
                if isinstance(self.fn, dict):
                    self.fn = mlrun.runtimes.RemoteRuntime.from_dict(self.fn)

            except mlrun.MLRunNotFoundError as e:
                raise e

        if not isinstance(self.fn, mlrun.runtimes.RemoteRuntime):
            raise mlrun.errors.MLRunRuntimeError(
                f"Failed reading function '{self.fn}' from DB\n"
                "Verify that the function URI is correct and that the function is stored properly."
            )

        url = self.fn.get_url()

        if not url:
            raise mlrun.errors.MLRunRuntimeError(
                f"Could not determine the function URL for '{self.fn.metadata.name}'. \n"
                "Make sure the function is deployed and reachable."
            )

        self.url = url
        super().post_init(mode=mode, **kwargs)