The log_metadata() function allows you to attach metadata to various ZenML entities including steps, pipeline runs, artifacts, and model versions.
Signature
def log_metadata(
    metadata: Dict[str, MetadataType],
    # Step and run parameters
    step_id: Optional[UUID] = None,
    step_name: Optional[str] = None,
    run_id_name_or_prefix: Optional[Union[UUID, str]] = None,
    # Artifact parameters
    artifact_version_id: Optional[UUID] = None,
    artifact_name: Optional[str] = None,
    artifact_version: Optional[str] = None,
    infer_artifact: bool = False,
    # Model parameters
    model_version_id: Optional[UUID] = None,
    model_name: Optional[str] = None,
    model_version: Optional[Union[ModelStages, int, str]] = None,
    infer_model: bool = False,
) -> None
Parameters
metadata
Dict[str, MetadataType]
required
Dictionary of metadata key-value pairs to log. Values can be strings, numbers, booleans, lists, or dicts.
step_id: The ID of a specific step to attach metadata to.
step_name: The name of a step (requires run_id_name_or_prefix).
run_id_name_or_prefix: The ID, name, or prefix of a pipeline run.
artifact_version_id: The ID of a specific artifact version.
artifact_name: The name of an artifact (requires artifact_version for external calls).
artifact_version: The version of the artifact.
infer_artifact: Whether to infer the artifact from the step context (must be called inside a step).
model_version_id: The ID of a specific model version.
model_name: The name of a model (requires model_version).
model_version
Union[ModelStages, int, str]
The version or stage of the model.
Whether to infer the model from the step context (must be called inside a step with a configured model).
Examples
from zenml import step, log_metadata


@step
def training_step() -> None:
    """Train a (stub) model and log its metrics to the current step.

    Calling log_metadata with no target arguments inside a running step
    attaches the metadata to that step.
    """
    # Train model
    accuracy = 0.95
    loss = 0.05
    # Log to the current step
    log_metadata({
        "accuracy": accuracy,
        "loss": loss,
        "framework": "tensorflow",
        "epochs": 100,
    })
from zenml import step, log_metadata
import pandas as pd


@step
def create_dataset() -> pd.DataFrame:
    """Build a toy dataset and attach size metadata to its output artifact.

    Returns:
        A single-column DataFrame with 1000 rows.
    """
    df = pd.DataFrame({"value": range(1000)})
    # Log metadata to the output artifact; infer_artifact=True targets
    # this step's output rather than the step itself.
    log_metadata(
        metadata={
            "num_rows": len(df),
            "num_columns": len(df.columns),
            "memory_usage": df.memory_usage(deep=True).sum(),
        },
        infer_artifact=True,
    )
    return df
from zenml import step, log_metadata
from typing import Tuple, Annotated
import pandas as pd


@step
def split_data() -> Tuple[
    Annotated[pd.DataFrame, "train"],
    Annotated[pd.DataFrame, "test"],
]:
    """Produce train/test splits and tag each output artifact separately.

    Returns:
        A (train, test) pair of DataFrames, named via Annotated so that
        artifact_name can address each one individually.
    """
    train = pd.DataFrame({"x": range(800)})
    test = pd.DataFrame({"x": range(200)})
    # Log metadata to specific outputs: artifact_name selects which of
    # the step's named outputs receives the metadata.
    log_metadata(
        metadata={"split": "train", "size": len(train)},
        artifact_name="train",
        infer_artifact=True,
    )
    log_metadata(
        metadata={"split": "test", "size": len(test)},
        artifact_name="test",
        infer_artifact=True,
    )
    return train, test
from zenml import step, log_metadata, Model


@step(model=Model(name="iris_classifier", version="1.0"))
def evaluate_model() -> float:
    """Evaluate the step's configured model and log results to its version.

    infer_model=True routes the metadata to the Model configured on the
    step decorator rather than to the step or an artifact.

    Returns:
        The (stub) test accuracy.
    """
    accuracy = 0.96
    # Log metadata to the model version
    log_metadata(
        metadata={
            "test_accuracy": accuracy,
            "test_samples": 150,
            "confusion_matrix": [[50, 0, 0], [0, 48, 2], [0, 1, 49]],
        },
        infer_model=True,
    )
    return accuracy
from zenml import log_metadata

# Log metadata to a previously created artifact. Outside a step context,
# the artifact is addressed explicitly by name + version.
log_metadata(
    metadata={
        "reviewed": True,
        "reviewer": "data_scientist_1",
        "quality_score": 9.5,
    },
    artifact_name="training_data",
    artifact_version="5",
)
from zenml import step, log_metadata


@step
def monitor_step() -> None:
    """Attach run-level metadata to an explicitly named pipeline run.

    Passing run_id_name_or_prefix targets the whole run instead of the
    currently executing step.
    """
    # Log metadata to the entire pipeline run
    log_metadata(
        metadata={
            "environment": "production",
            "triggered_by": "scheduler",
            "priority": "high",
        },
        run_id_name_or_prefix="my_pipeline-2024_01_15-12_30_45",
    )
from zenml import log_metadata

# Log metadata to a specific step in a specific run: step_name alone is
# ambiguous, so it is combined with run_id_name_or_prefix.
log_metadata(
    metadata={
        "retry_count": 3,
        "error_resolved": True,
    },
    step_name="data_loader",
    run_id_name_or_prefix="my_pipeline-2024_01_15",
)
from zenml import step, log_metadata


@step
def analysis_step() -> None:
    """Demonstrate the range of value types accepted as metadata."""
    log_metadata({
        # Simple types
        "accuracy": 0.95,
        "model_type": "RandomForest",
        "is_production": True,
        # Lists
        "feature_names": ["age", "income", "education"],
        "class_labels": [0, 1, 2],
        # Nested structures
        "hyperparameters": {
            "n_estimators": 100,
            "max_depth": 10,
            "min_samples_split": 2,
        },
        # Arrays/matrices (as lists)
        "confusion_matrix": [
            [45, 2, 1],
            [3, 48, 2],
            [1, 1, 47],
        ],
    })
from zenml import log_metadata
from zenml.enums import ModelStages

# Log to production model: passing a ModelStages value as model_version
# selects the model version currently in that stage.
log_metadata(
    metadata={
        "deployed_at": "2024-01-15T10:30:00Z",
        "deployment_target": "kubernetes-cluster-1",
        "replicas": 3,
    },
    model_name="sentiment_analyzer",
    model_version=ModelStages.PRODUCTION,
)
from zenml import step, log_metadata


@step
def comprehensive_step() -> dict:
    """Log several independent metadata entries from a single step.

    Returns:
        The results dict whose score is also logged as metadata.
    """
    results = {"score": 0.92}
    # Log multiple metadata entries — each call is recorded separately.
    log_metadata({"preprocessing": "completed"})
    log_metadata({"training": "completed"})
    log_metadata({"validation": "completed"})
    log_metadata({"final_score": results["score"]})
    return results
The following Python types are supported as metadata values:
Primitives : str, int, float, bool
Collections : list, dict
None : None values are supported
Nested : Dictionaries and lists can be nested
Use Cases
Track experiment parameters - Log hyperparameters, configurations, and settings
Record performance metrics - Store accuracy, loss, and other evaluation metrics
Document data statistics - Save dataset sizes, distributions, and characteristics
Audit and compliance - Track who processed data, when, and under what conditions
Quality assurance - Mark artifacts as reviewed, validated, or approved
Deployment tracking - Record deployment information and environment details
log_artifact_metadata Deprecated artifact metadata function
log_model_metadata Deprecated model metadata function
get_step_context Access step context
bulk_log_metadata Log metadata to multiple entities