Source code for mlrun.hub.module

# Copyright 2025 Iguazio
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import warnings
from pathlib import Path
from typing import Union

import yaml
from deprecated import deprecated

import mlrun.common.types
import mlrun.utils
from mlrun.common.schemas.hub import HubModuleType, HubSourceType
from mlrun.run import get_object

from ..utils import extend_hub_uri_if_needed
from .base import HubAsset


[docs] class HubModule(HubAsset): ASSET_TYPE = HubSourceType.modules def __init__( self, name: str, version: str, kind: Union[HubModuleType, str], description: str | None = None, categories: list | None = None, requirements: list | None = None, local_path: Path | None = None, filename: str | None = None, example: str | None = None, url: str | None = None, **kwargs, # catch all for unused args ): super().__init__( name=name, version=version, description=description, categories=categories, requirements=requirements, local_path=local_path, filename=filename, example=example, url=url, ) self.kind = kind # TODO: Remove this in 1.13.0
[docs] @deprecated( version="1.11.0", reason="This function is deprecated and will be removed in 1.13. You can download module files by calling " "download_files() instead.", category=FutureWarning, ) def download_module_files( self, local_path: str | None = None, secrets: dict | None = None ): """ Download this hub module’s files (code file and, if available, an example notebook) to the target directory specified by `local_path` (defaults to the current working directory). This path will be used later to locate the code file when importing the module. """ self.local_path = self.verify_directory(path=local_path) source_url, _ = extend_hub_uri_if_needed( uri=self.url, asset_type=self.ASSET_TYPE, file=self.filename ) self._download_object( obj_url=source_url, target_name=self.filename, secrets=secrets ) if self.example: example_url, _ = extend_hub_uri_if_needed( uri=self.url, asset_type=self.ASSET_TYPE, file=self.example ) self._download_object( obj_url=example_url, target_name=self.example, secrets=secrets )
[docs] def download_files( self, local_path: str | None = None, download_example: bool = True, ): """ Download this hub module’s code file. :param local_path: Target directory to download the module files to. Defaults to the current working directory. This path will be used to locate the code file when importing it as a module. :param download_example: Whether to download the example notebook if available. Defaults to True. """ super().download_files( local_path=local_path, download_example=download_example, )
# TODO: Remove this in 1.13.0
[docs] @deprecated( version="1.11.0", reason="This function is deprecated and will be removed in 1.13. You can get the module source file path by" " calling get_src_file_path() instead.", category=FutureWarning, ) def get_module_file_path(self): """Get the full path to the module's code file.""" return super().get_src_file_path()
[docs] def get_hub_module( url: str, download_files: bool = True, secrets: dict | None = None, local_path: str | None = None, ) -> HubModule: """ Get a hub-module object containing metadata of the requested module. :param url: Hub module url in the format "hub://[<source>/]<item-name>[:<tag>]" :param download_files: When set to True, the module files (code file and example notebook) are downloaded :param secrets: Optional, credentials dict for DB or URL (s3, v3io, ...) :param local_path: Path to target directory for the module files. Ignored when download_files is set to False. Defaults to the current working directory. :return: HubModule object """ item_yaml_url, is_hub_uri = extend_hub_uri_if_needed( uri=url, asset_type=HubSourceType.modules, file="item.yaml" ) if not is_hub_uri: raise mlrun.errors.MLRunInvalidArgumentError("Not a valid hub URL") yaml_obj = get_object(url=item_yaml_url, secrets=secrets) item_yaml = yaml.safe_load(yaml_obj) spec = item_yaml.pop("spec", {}) hub_module = HubModule(**item_yaml, **spec, url=url) if download_files: with warnings.catch_warnings(): warnings.filterwarnings("ignore", category=FutureWarning) hub_module.download_module_files(local_path=local_path, secrets=secrets) return hub_module
[docs] def import_module( url: str, install_requirements: bool = False, secrets: dict | None = None, local_path: str | None = None, ): """ Import a module from the hub to use directly. :param url: hub module url in the format "hub://[<source>/]<item-name>[:<tag>]" :param install_requirements: when set to True, the module's requirements are installed. :param secrets: optional, credentials dict for DB or URL (s3, v3io, ...) :param local_path: Path to target directory for the module files (code and example notebook). Defaults to the current working directory. :return: the module """ hub_module: HubModule = get_hub_module( url=url, download_files=True, secrets=secrets, local_path=local_path ) if install_requirements: hub_module.install_requirements() return hub_module.module()