Basic Tracker - SIENTIA™ Log Libraries

Basic

Overview

The `basic` module of `sientia_tracker` provides `BaseTracker`, a generic tracker object with no additional requirements beyond the connection details of the tracking server. It wraps MLflow, an open-source Machine Learning tracking library, for logging experiments, models, and metrics.

`BaseTracker`

Basic Tracker object that doesn't have any additional requirements or parameters to be used

Source code in sientia_tracker/basic.py

class BaseTracker:
    """
    Basic Tracker object that don't have any requirements nor parameters to be used
    """
    def __init__(self, tracking_uri:str, username: str = None, password: str = None)-> None:
        """
        Initialize the tracker object

        Parameters:
            tracking_uri: URI to the MLflow server
            username: Username to access the MLflow server
            password: Password to access the MLflow server

        Returns:
            None
        """

        mlflow.set_tracking_uri(tracking_uri)

        os.environ['MLFLOW_TRACKING_USERNAME'] = username
        os.environ['MLFLOW_TRACKING_PASSWORD'] = password
        # Create an MLflow client
        self.client = mlflow.tracking.MlflowClient()

    def log_model(self, sk_model: Any, artifact_path: Any, extra_pip_requirements: Any | None = None,**kwargs):
        """
        Log a model to MLflow.

        Parameters:
            sk_model: scikit-learn model to be saved
            artifact_path: name of the model
            extra_pip_requirements: additional pip requirements to be installed

        Returns:
            None
        """
        mlflow.sklearn.log_model(sk_model, artifact_path, extra_pip_requirements,**kwargs)

    def log_params(self, params: Dict[str, Any], **kwargs) -> None:
        """
        Log parameters to MLflow.

        Parameters:
            params: Dict with the parameters to log.

        Returns:
            None
        """
        mlflow.log_params(params, **kwargs)

    def log_metrics(self, params: Dict[str, float], **kwargs) -> None:
        """
        Log metrics to MLflow.

        Parameters:
            params: Dict with the metrics to log.

        Returns:
            None
        """
        mlflow.log_metrics(params, **kwargs)

    def log_artifact(self, local_path: str, artifact_path: str | None = None, **kwargs) -> None:
        """
        Log an artifact to MLflow.

        Parameters:
            local_path: Path to the file to write.
            artifact_path: If provided, the directory in artifact_uri to write to.

        Returns:
            None
        """
        mlflow.log_artifact(local_path, artifact_path, **kwargs)

    def set_project(self, project_name: str)-> None:
        """
        Check if the experiment already exists; if not, create it

        Parameters:
            project_name (str): The name of the project.

        Returns:
            None
        """
        project = mlflow.get_experiment_by_name(
            project_name)
        if project is None:
            mlflow.create_experiment(name=project_name)
            self.project_name = project_name
            print(f"Experiment {project_name} created")

        else:
            # Activate the experiment for tracking
            mlflow.set_experiment(project_name)
            self.project_name = project_name
            print(f"Experiment {project_name} already exists")

    def save_experiment(self):
        """
        Start a run in MLflow.

        Parameters:
            **kwargs: The parameters to log.

        Returns:
            None
        """
        print("Saving experiment", self.project_name)
        runs = mlflow.search_runs(experiment_names=[
            self.project_name], order_by=["start_time desc"])
        next_run_number = len(runs) + 1
        active_run = mlflow.start_run(run_name=f"{self.project_name}-{next_run_number}")
        return active_run

    def get_model_run_id(self, model_name: str, stage: str = "Production"):
        """
        Get the run_id of a model based on its name and stage.

        Parameters:
            model_name (str): The name of the model.
            stage (str): The stage of the model.

        Returns:
            str: The run_id of the model.
        """
        latest_versions = self.client.get_latest_versions(
            name=model_name, stages=[stage])
        run_id = latest_versions[0].source.split("/")
        return run_id[2]

    def get_model_experiment_id(self, model_name: str):
        """
        Get the project name associated with a model.

        Parameters:
            model_name (str): The name of the model.

        Returns:
            str: The project name.
        """
        latest_production_id = self.get_model_run_id(model_name=model_name, stage="Production")
        run_info = mlflow.get_run(latest_production_id)
        return run_info.info.experiment_id

    def get_run_name(self, run_id: str):
        """
        Get the run name associated with a run ID.

        Parameters:
            run_id (str): Run ID.

        Returns:
            str: Run name.
        """
        if run_id:
            run_info = mlflow.get_run(run_id)
            run_name = run_info.info.run_name
        else:
            run_name = None
        return run_name

`__init__(tracking_uri, username=None, password=None)`

Initialize the tracker object

Parameters:	`tracking_uri` (`str`) – URI to the MLflow server `username` (`str`, default: `None` ) – Username to access the MLflow server `password` (`str`, default: `None` ) – Password to access the MLflow server

Returns:	`None` – None

Source code in sientia_tracker/basic.py

def __init__(self, tracking_uri: str, username: str | None = None, password: str | None = None) -> None:
    """
    Initialize the tracker object

    Parameters:
        tracking_uri: URI to the MLflow server
        username: Username to access the MLflow server. When None, the
            MLFLOW_TRACKING_USERNAME environment variable is left untouched.
        password: Password to access the MLflow server. When None, the
            MLFLOW_TRACKING_PASSWORD environment variable is left untouched.

    Returns:
        None
    """

    mlflow.set_tracking_uri(tracking_uri)

    # os.environ only accepts strings: assigning None raises TypeError, so
    # the credentials are exported only when they were actually supplied.
    if username is not None:
        os.environ['MLFLOW_TRACKING_USERNAME'] = username
    if password is not None:
        os.environ['MLFLOW_TRACKING_PASSWORD'] = password
    # Create an MLflow client
    self.client = mlflow.tracking.MlflowClient()

`get_model_experiment_id(model_name)`

Get the ID of the experiment that holds the model's Production version.

Parameters:	`model_name` (`str`) – The name of the model.

Returns:	`str` – The experiment ID.

Source code in sientia_tracker/basic.py

def get_model_experiment_id(self, model_name: str):
    """
    Look up the experiment behind a model's Production version.

    The run ID of the Production version is resolved through
    ``get_model_run_id``; the run is then fetched from MLflow and its
    ``experiment_id`` is returned.

    Parameters:
        model_name (str): The name of the model.

    Returns:
        The ``experiment_id`` of the run behind the Production version.
    """
    production_run_id = self.get_model_run_id(model_name=model_name, stage="Production")
    return mlflow.get_run(production_run_id).info.experiment_id

`get_model_run_id(model_name, stage='Production')`

Get the run_id of a model based on its name and stage.

Parameters:	`model_name` (`str`) – The name of the model. `stage` (`str`, default: `'Production'` ) – The stage of the model.

Returns:	`str` – The run_id of the model.

Source code in sientia_tracker/basic.py

def get_model_run_id(self, model_name: str, stage: str = "Production"):
    """
    Get the run_id of a model based on its name and stage.

    Parameters:
        model_name (str): The name of the model.
        stage (str): The stage of the model.

    Returns:
        str: The run_id of the model.

    Raises:
        IndexError: If the model has no version in the requested stage.
    """
    latest_versions = self.client.get_latest_versions(
        name=model_name, stages=[stage])
    if not latest_versions:
        raise IndexError(
            f"No version of model '{model_name}' found in stage '{stage}'")

    version = latest_versions[0]
    # Prefer the run ID recorded on the model version; the position of the
    # run ID inside the source URI depends on the artifact store layout.
    run_id = getattr(version, "run_id", None)
    if run_id:
        return run_id
    # Fallback for versions without a run_id: third "/"-separated segment
    # of the source URI (the original lookup).
    return version.source.split("/")[2]

`get_run_name(run_id)`

Get the run name associated with a run ID.

Parameters:	`run_id` (`str`) – Run ID.

Returns:	`str` – Run name.

Source code in sientia_tracker/basic.py

def get_run_name(self, run_id: str):
    """
    Resolve a run ID to the name of that run.

    Parameters:
        run_id (str): Run ID.

    Returns:
        The run name, or None when ``run_id`` is empty or None (MLflow is
        not queried in that case).
    """
    # Guard clause: nothing to look up without a run ID.
    if not run_id:
        return None
    return mlflow.get_run(run_id).info.run_name

`log_artifact(local_path, artifact_path=None, **kwargs)`

Log an artifact to MLflow.

Parameters:	`local_path` (`str`) – Path to the file to write. `artifact_path` (`str \| None`, default: `None` ) – If provided, the directory in artifact_uri to write to.

Returns:	`None` – None

Source code in sientia_tracker/basic.py

def log_artifact(self, local_path: str, artifact_path: str | None = None, **kwargs) -> None:
    """
    Upload a local file as an artifact via ``mlflow.log_artifact``.

    Parameters:
        local_path: Path to the file to write.
        artifact_path: If provided, the directory in artifact_uri to write to.
        **kwargs: Forwarded unchanged to ``mlflow.log_artifact``.

    Returns:
        None
    """
    mlflow.log_artifact(
        local_path,
        artifact_path,
        **kwargs,
    )

`log_metrics(params, **kwargs)`

Log metrics to MLflow.

Parameters:	`params` (`Dict[str, float]`) – Dict with the metrics to log.

Returns:	`None` – None

Source code in sientia_tracker/basic.py

def log_metrics(self, params: Dict[str, float], **kwargs) -> None:
    """
    Record a batch of metrics via ``mlflow.log_metrics``.

    Parameters:
        params: Dict with the metrics to log.
        **kwargs: Forwarded unchanged to ``mlflow.log_metrics``.

    Returns:
        None
    """
    mlflow.log_metrics(
        params,
        **kwargs,
    )

`log_model(sk_model, artifact_path, extra_pip_requirements=None, **kwargs)`

Log a model to MLflow.

Parameters:	`sk_model` (`Any`) – scikit-learn model to be saved `artifact_path` (`Any`) – name of the model `extra_pip_requirements` (`Any \| None`, default: `None` ) – additional pip requirements to be installed

Returns:	`None` – None

Source code in sientia_tracker/basic.py

def log_model(self, sk_model: Any, artifact_path: Any, extra_pip_requirements: Any | None = None, **kwargs) -> None:
    """
    Log a scikit-learn model to MLflow.

    Parameters:
        sk_model: scikit-learn model to be saved
        artifact_path: name of the model
        extra_pip_requirements: additional pip requirements to be installed
        **kwargs: forwarded unchanged to ``mlflow.sklearn.log_model``

    Returns:
        None
    """
    # Passed by keyword on purpose: the third positional parameter of
    # mlflow.sklearn.log_model is conda_env, not extra_pip_requirements.
    mlflow.sklearn.log_model(
        sk_model,
        artifact_path,
        extra_pip_requirements=extra_pip_requirements,
        **kwargs,
    )

`log_params(params, **kwargs)`

Log parameters to MLflow.

Parameters:	`params` (`Dict[str, Any]`) – Dict with the parameters to log.

Returns:	`None` – None

Source code in sientia_tracker/basic.py

def log_params(self, params: Dict[str, Any], **kwargs) -> None:
    """
    Record a batch of parameters via ``mlflow.log_params``.

    Parameters:
        params: Dict with the parameters to log.
        **kwargs: Forwarded unchanged to ``mlflow.log_params``.

    Returns:
        None
    """
    mlflow.log_params(
        params,
        **kwargs,
    )

`save_experiment()`

Start a run in MLflow.

Parameters:	None – this method takes no arguments; it uses the project name stored by `set_project`.

Returns:	The active run started by `mlflow.start_run`.

Source code in sientia_tracker/basic.py

def save_experiment(self):
    """
    Start a new MLflow run for the current project.

    The run is named ``<project_name>-<n>``, where ``n`` is one more than
    the number of runs ``mlflow.search_runs`` returns for the project.
    Reads ``self.project_name``, so the project must already be set on the
    instance.

    Returns:
        The value returned by ``mlflow.start_run`` (the active run).
    """
    project = self.project_name
    print("Saving experiment", project)

    existing_runs = mlflow.search_runs(
        experiment_names=[project],
        order_by=["start_time desc"],
    )
    # Number the new run after the ones already recorded.
    run_label = f"{project}-{len(existing_runs) + 1}"
    return mlflow.start_run(run_name=run_label)

`set_project(project_name)`

Check if the experiment already exists; if not, create it

Parameters:	`project_name` (`str`) – The name of the project.

Returns:	`None` – None

Source code in sientia_tracker/basic.py

def set_project(self, project_name: str) -> None:
    """
    Select the experiment to track, creating it first if it does not exist.

    The name is remembered in ``self.project_name`` for later use by the
    tracker.

    Parameters:
        project_name (str): The name of the project.

    Returns:
        None
    """
    already_exists = mlflow.get_experiment_by_name(project_name) is not None
    if not already_exists:
        mlflow.create_experiment(name=project_name)

    # Activate the experiment in both cases; creating an experiment does
    # not make it the active one, so new runs would land elsewhere.
    mlflow.set_experiment(project_name)
    self.project_name = project_name

    if already_exists:
        print(f"Experiment {project_name} already exists")
    else:
        print(f"Experiment {project_name} created")

« Previous Next »