Model Utilities

Examples

Examples of using the Model Utilities are listed at the bottom of this page; see Examples.

Model Utilities for Workbench models

`cleanlab_model_local(model)`

Create a CleanlabModels instance for detecting data quality issues in a Model's training data.

Parameters:

Name	Type	Description	Default
`model`	`Model`	The Model used to create the cleanlab models	required

Returns:

Name	Type	Description
`CleanlabModels`	`CleanlabModels`	Label-quality analysis with helpers like label_issues(), epistemic_uncertainty(), and the native clean_learning()/datalab() objects.

Source code in src/workbench/utils/model_utils.py

def cleanlab_model_local(model: Model) -> CleanlabModels:
    """Build a CleanlabModels instance for inspecting data quality in a Model's training data.

    Feature columns, target column, and model type are read from the given Model. The
    ID column and the dataframe come from the FeatureSet constructed from
    ``model.get_input()``.

    Args:
        model (Model): The Model used to create the cleanlab models

    Returns:
        CleanlabModels: Label-quality analysis with helpers like label_issues(),
            epistemic_uncertainty(), and the native clean_learning()/datalab() objects.
    """
    from workbench.algorithms.models.cleanlab_model import CleanlabModels  # noqa: F401 (avoid circular import)
    from workbench.api import Model, FeatureSet  # noqa: F401 (avoid circular import)

    # Everything the analysis needs to know about the Model itself
    feature_cols = model.features()
    target_col = model.target()
    kind_of_model = model.model_type

    # The Model's input names its FeatureSet, which owns the ID column and the full data
    feature_set = FeatureSet(model.get_input())
    id_col = feature_set.id_column
    all_rows = feature_set.pull_dataframe()

    return CleanlabModels(all_rows, id_col, feature_cols, target_col, model_type=kind_of_model)

`copy_model_artifacts(model, dst_name)`

Stage a model copy's S3 artifacts under the destination's training dir.

Copies the frozen model.tar.gz and its sibling output.tar.gz (the training job's output channel, which carries the HPO audit trail) plus the top-level training-capture files (validation_predictions.csv, shap_*) into {models_s3_path}/{dst_name}/training/. The frozen artifact lives in the copy's own dir so it's immune to the source's delete-then-create churn.

Parameters:

Name	Type	Description	Default
`model`	`Model`	The source model being copied	required
`dst_name`	`str`	Name of the destination model group	required

Returns:

Name	Type	Description
`str`	`str`	The frozen model.tar.gz S3 URL for the copy's container spec

Source code in src/workbench/utils/model_utils.py

def copy_model_artifacts(model: "Model", dst_name: str) -> str:
    """Stage a model copy's S3 artifacts under the destination's training dir.

    Copies the frozen model.tar.gz and its sibling output.tar.gz (the training job's
    output channel, which carries the HPO audit trail) plus the top-level
    training-capture files (validation_predictions.csv, shap_*) into
    {models_s3_path}/{dst_name}/training/. The frozen artifact lives in the copy's own
    dir so it's immune to the source's delete-then-create churn.

    Every S3 call (existence check, listing, copies) uses the model's own boto3 session.

    Args:
        model (Model): The source model being copied
        dst_name (str): Name of the destination model group

    Returns:
        str: The frozen model.tar.gz S3 URL for the copy's container spec

    Raises:
        ValueError: If the source model has no model artifact (model_data_url() is None)
    """
    src_url = model.model_data_url()
    if src_url is None:
        # Fail with a clear message instead of an AttributeError on None.rsplit below
        raise ValueError(f"No model artifact found for {model.name}")

    dst_training_path = f"{model.models_s3_path}/{dst_name}/training"
    session = model.boto3_session

    # Freeze the artifact under the copy's own training dir, keeping output.tar.gz beside
    # it so readers that resolve it from model_data_url() (get_hpo_results) work on the copy
    src_dir = src_url.rsplit("/", 1)[0]
    output_url = f"{src_dir}/output.tar.gz"
    src_objs = [src_url]
    if wr.s3.does_object_exist(output_url, boto3_session=session):
        src_objs.append(output_url)
    wr.s3.copy_objects(
        src_objs,
        source_path=src_dir,
        target_path=dst_training_path,
        boto3_session=session,
    )

    # Carry the top-level training-capture files (skip timestamped job-output subdirs).
    # A "/" left after stripping the prefix means the object lives in a subdirectory.
    prefix = model.model_training_path + "/"
    training_objs = [
        o for o in wr.s3.list_objects(path=prefix, boto3_session=session) if "/" not in o[len(prefix) :]
    ]
    if training_objs:
        wr.s3.copy_objects(
            training_objs,
            source_path=model.model_training_path,
            target_path=dst_training_path,
            boto3_session=session,
        )

    return f"{dst_training_path}/model.tar.gz"

`extracted_artifact(artifact_uri)`

Download an S3 tarball and yield the temp directory it extracted into.

Yields None when the object can't be fetched — callers name a specific artifact and a bundle need not contain it (only searched models write `output.tar.gz`). The directory is removed on exit, so read what you need inside the `with` block.

Parameters:

Name	Type	Description	Default
`artifact_uri`	`str`	S3 URI of a .tar.gz artifact.	required

Yields:

Type	Description
`Optional[str]`	str \| None: Path to the extracted directory, or None if the download failed.

Source code in src/workbench/utils/model_utils.py

@contextmanager
def extracted_artifact(artifact_uri: str) -> Iterator[Optional[str]]:
    """Download an S3 tarball and yield the temp directory it extracted into.

    Yields None when the object can't be fetched — callers name a specific artifact and a
    bundle need not contain it (only searched models write ``output.tar.gz``). The directory
    is removed on exit, so read what you need inside the ``with``.

    Only the download is best-effort: a failure there is logged at debug level and
    swallowed. Errors raised while extracting the tarball propagate to the caller.

    Args:
        artifact_uri (str): S3 URI of a .tar.gz artifact.

    Yields:
        str | None: Path to the extracted directory, or None if the download failed.
    """
    with tempfile.TemporaryDirectory() as tmpdir:
        local_tar_path = os.path.join(tmpdir, "artifact.tar.gz")
        try:
            wr.s3.download(path=artifact_uri, local_file=local_tar_path)
        except Exception as e:
            log.debug(f"Could not download artifact {artifact_uri}: {e}")
            downloaded = False
        else:
            downloaded = True

        # Yield outside the except handler: an exception raised in the caller's with-body
        # is thrown in at the yield, and inside the handler it would be implicitly chained
        # to the (already handled) download error, producing a misleading traceback.
        if not downloaded:
            yield None
            return

        safe_extract_tarfile(local_tar_path, tmpdir)
        yield tmpdir

`get_model_hyperparameters(workbench_model)`

Get the hyperparameters used to train a Workbench model.

Reads from Workbench meta (a cheap tag read). Models predating meta storage fall back to the model artifact and are backfilled into meta on first read.

Parameters:

Name	Type	Description	Default
`workbench_model`	`Any`	Workbench model object	required

Returns:

Name	Type	Description
`dict`	`Optional[dict]`	The hyperparameters used during training, or None if not found

Source code in src/workbench/utils/model_utils.py

def get_model_hyperparameters(workbench_model: Any) -> Optional[dict]:
    """Return the hyperparameters a Workbench model was trained with.

    The value stored under ``"workbench_hyperparameters"`` in the model's Workbench meta
    is returned whenever it is not None. Otherwise the hyperparameters are loaded from
    the model artifact and, if found, written back into meta so the next call can use
    the stored value.

    Args:
        workbench_model: Workbench model object

    Returns:
        dict: The hyperparameters used during training, or None if not found
    """
    meta_key = "workbench_hyperparameters"

    # Cheap path: the value is already stored in Workbench meta
    cached = workbench_model.workbench_meta().get(meta_key)
    if cached is not None:
        return cached

    # Legacy path: read them out of the model artifact (model.tar.gz)
    artifact_uri = workbench_model.model_data_url()
    if artifact_uri is None:
        log.warning(f"No model artifact found for {workbench_model.name}")
        return None

    from_artifact = load_hyperparameters_from_s3(artifact_uri)
    if from_artifact is None:
        return None

    # Store what we found so later reads skip the artifact download
    workbench_model.upsert_workbench_meta({meta_key: from_artifact})
    return from_artifact

`instance_architecture(instance_name)`

Get the architecture for the given instance name

Source code in src/workbench/utils/model_utils.py

def instance_architecture(instance_name: str) -> str:
    """Look up the "Architecture" value of the first model_instance_info() row for this instance name"""
    table = model_instance_info()
    name_matches = table["Instance Name"] == instance_name
    architectures = table.loc[name_matches, "Architecture"]
    return architectures.values[0]

`load_category_mappings_from_s3(model_artifact_uri)`

Download and extract category mappings from a model artifact in S3.

Parameters:

Name	Type	Description	Default
`model_artifact_uri`	`str`	S3 URI of the model artifact.	required

Returns:

Name	Type	Description
`dict`	`Optional[dict]`	The loaded category mappings or None if not found.

Source code in src/workbench/utils/model_utils.py

def load_category_mappings_from_s3(model_artifact_uri: str) -> Optional[dict]:
    """
    Load the category mappings stored in a model artifact in S3.

    Delegates to ``_load_json_from_artifact`` with the file name ``category_mappings.json``.

    Args:
        model_artifact_uri (str): S3 URI of the model artifact.

    Returns:
        dict: The loaded category mappings or None if not found.
    """
    category_mappings = _load_json_from_artifact(model_artifact_uri, "category_mappings.json")
    return category_mappings

`load_hyperparameters_from_s3(model_artifact_uri)`

Download and extract hyperparameters from a model artifact in S3.

Parameters:

Name	Type	Description	Default
`model_artifact_uri`	`str`	S3 URI of the model artifact (model.tar.gz).	required

Returns:

Name	Type	Description
`dict`	`Optional[dict]`	The loaded hyperparameters or None if not found.

Source code in src/workbench/utils/model_utils.py

def load_hyperparameters_from_s3(model_artifact_uri: str) -> Optional[dict]:
    """
    Load the hyperparameters stored in a model artifact in S3.

    Delegates to ``_load_json_from_artifact`` with the file name ``hyperparameters.json``.

    Args:
        model_artifact_uri (str): S3 URI of the model artifact (model.tar.gz).

    Returns:
        dict: The loaded hyperparameters or None if not found.
    """
    hyperparameters = _load_json_from_artifact(model_artifact_uri, "hyperparameters.json")
    return hyperparameters

`model_instance_info()`

Instance reference for the Model: hardware, us-east-1 on-demand price, and role.

Price per Hour is the rate for the instance's Usage — SageMaker charges a different rate for the same instance hosting an endpoint versus running a training job. The Training rows are the ladders in workbench.core.transforms.features_to_model.INSTANCE_LADDERS.

Source code in src/workbench/utils/model_utils.py

def model_instance_info() -> pd.DataFrame:
    """Reference table of instances for the Model: hardware, us-east-1 on-demand price, and role.

    One row per instance. "Price per Hour" is the rate for the row's "Usage" — SageMaker
    charges a different rate for the same instance hosting an endpoint versus running a
    training job. The Training rows are the ladders in
    ``workbench.core.transforms.features_to_model.INSTANCE_LADDERS``.

    Returns:
        pd.DataFrame: Columns "Instance Name", "Num CPUs", "Num GPUs", "Memory",
            "Price per Hour", "Category", "Architecture", and "Usage".
    """
    columns = (
        "Instance Name",
        "Num CPUs",
        "Num GPUs",
        "Memory",
        "Price per Hour",
        "Category",
        "Architecture",
        "Usage",
    )
    rows = [
        # Hosting
        ("ml.t2.medium", 2, 0, 4, 0.06, "General", "x86_64", "Hosting"),
        ("ml.m7i.large", 2, 0, 8, 0.12, "General", "x86_64", "Hosting"),
        ("ml.c7i.large", 2, 0, 4, 0.11, "Compute", "x86_64", "Hosting"),
        ("ml.c7i.xlarge", 4, 0, 8, 0.21, "Compute", "x86_64", "Hosting"),
        ("ml.c7g.large", 2, 0, 4, 0.09, "Compute", "arm64", "Hosting"),
        ("ml.c7g.xlarge", 4, 0, 8, 0.17, "Compute", "arm64", "Hosting"),
        # Training
        ("ml.m5.xlarge", 4, 0, 16, 0.23, "General", "x86_64", "Training"),
        ("ml.c7i.4xlarge", 16, 0, 32, 0.86, "Compute", "x86_64", "Training"),
        ("ml.g6.2xlarge", 8, 1, 32, 1.21, "GPU", "x86_64", "Training"),  # NVIDIA L4 24GB
        ("ml.g6.12xlarge", 48, 4, 192, 5.61, "GPU", "x86_64", "Training"),  # NVIDIA L4 24GB
        ("ml.g5.12xlarge", 48, 4, 192, 7.09, "GPU", "x86_64", "Training"),  # NVIDIA A10G 24GB
    ]
    return pd.DataFrame(rows, columns=list(columns))

`noise_model_local(model)`

Create a NoiseModel for detecting noisy/problematic samples in a Model's training data.

Parameters:

Name	Type	Description	Default
`model`	`Model`	The Model used to create the noise model	required

Returns:

Name	Type	Description
`NoiseModel`	`NoiseModel`	The noise model with precomputed noise scores for all samples

Source code in src/workbench/utils/model_utils.py

def noise_model_local(model: Model) -> NoiseModel:
    """Build a NoiseModel for spotting noisy/problematic samples in a Model's training data.

    The NoiseModel is constructed from the full FeatureSet dataframe. Before that, an
    ``in_model`` boolean column is added to the dataframe: True for rows whose ID also
    appears in the Model's training view.

    Args:
        model (Model): The Model used to create the noise model

    Returns:
        NoiseModel: The noise model with precomputed noise scores for all samples
    """
    from workbench.algorithms.models.noise_model import NoiseModel  # noqa: F401 (avoid circular import)
    from workbench.api import Model, FeatureSet  # noqa: F401 (avoid circular import)

    # Columns the existing Model was built on
    feature_cols = model.features()
    target_col = model.target()

    # The Model's input names its FeatureSet, which tells us the ID column
    feature_set = FeatureSet(model.get_input())
    id_col = feature_set.id_column

    # Pull every FeatureSet row, plus the rows in the Model's training view
    all_rows = feature_set.pull_dataframe()
    training_rows = model.training_view().pull_dataframe()

    # Flag the FeatureSet rows whose ID appears in the training view
    all_rows["in_model"] = all_rows[id_col].isin(set(training_rows[id_col]))

    return NoiseModel(all_rows, id_col, feature_cols, target_col)

`safe_extract_tarfile(tar_path, extract_path)`

Extract a tarball safely, using data filter if available.

The `filter` parameter was added in Python 3.12 and backported to 3.8.17, 3.9.17, 3.10.12, and 3.11.4 as a security patch, so it may not be present in older patch versions.

Source code in src/workbench/utils/model_utils.py

def _checked_tar_members(tar: tarfile.TarFile, extract_path: str) -> list:
    """Return the archive's members after verifying none of them can land outside extract_path."""
    root = os.path.realpath(extract_path)

    def _inside_root(candidate: str) -> bool:
        # realpath collapses ".." segments and resolves symlinks that already exist on disk
        return os.path.commonpath([root, os.path.realpath(candidate)]) == root

    members = tar.getmembers()
    for member in members:
        # os.path.join discards root when member.name is absolute, so absolute names fail the check
        destination = os.path.join(root, member.name)
        if not _inside_root(destination):
            raise tarfile.TarError(f"Refusing to extract '{member.name}': path escapes '{extract_path}'")

        # Symlink targets are relative to the link's own directory; hard-link targets
        # are member names, i.e. relative to the extraction root
        if member.issym():
            link_target = os.path.join(os.path.dirname(destination), member.linkname)
        elif member.islnk():
            link_target = os.path.join(root, member.linkname)
        else:
            continue
        if not _inside_root(link_target):
            raise tarfile.TarError(
                f"Refusing to extract '{member.name}': link target '{member.linkname}' escapes '{extract_path}'"
            )
    return members


def safe_extract_tarfile(tar_path: str, extract_path: str) -> None:
    """
    Extract a gzip-compressed tarball safely.

    Uses the tarfile ``data`` extraction filter when the running Python provides it.
    The filter was added in Python 3.12 and backported as a security patch to 3.8.17,
    3.9.17, 3.10.12, and 3.11.4, so older patch versions lack it. On those interpreters
    every member path and link target is checked by hand, and the archive is rejected
    before anything is written if one of them would resolve outside ``extract_path``.

    Args:
        tar_path (str): Local path of the .tar.gz file to extract.
        extract_path (str): Directory to extract into.

    Raises:
        tarfile.TarError: If a member would be written outside ``extract_path`` (with the
            ``data`` filter this is a ``tarfile.FilterError`` subclass).
    """
    with tarfile.open(tar_path, "r:gz") as tar:
        if hasattr(tarfile, "data_filter"):
            tar.extractall(path=extract_path, filter="data")
        else:
            # No filter support: validate every member ourselves instead of extracting blindly
            tar.extractall(path=extract_path, members=_checked_tar_members(tar, extract_path))

`supported_instance_types(arch='x86_64', usage='Hosting')`

Get the supported instance types for the given architecture and usage (Hosting/Training)

Source code in src/workbench/utils/model_utils.py

def supported_instance_types(arch: str = "x86_64", usage: str = "Hosting") -> list:
    """List the instance names in model_instance_info() matching the given architecture and usage (Hosting/Training)"""
    table = model_instance_info()
    arch_matches = table["Architecture"] == arch
    usage_matches = table["Usage"] == usage
    return table.loc[arch_matches & usage_matches, "Instance Name"].tolist()

`uq_metrics(df, target_col)`

Evaluate uncertainty quantification model with essential metrics.

Args:

- `df`: DataFrame with predictions and uncertainty estimates. Must contain the target column, a "prediction" column, and a "prediction_std" column (required for CRPS and median_std). Quantile columns ("q_025", "q_975", "q_05", "q_95", "q_10", "q_90", "q_25", "q_75") are used for coverage/width when present; otherwise Gaussian bounds are derived from "prediction_std".
- `target_col`: Name of the true target column in the DataFrame.

Returns: Dictionary of computed metrics.

Source code in src/workbench/utils/model_utils.py

def uq_metrics(df: pd.DataFrame, target_col: str) -> Dict[str, Any]:
    """Evaluate an uncertainty quantification model with essential metrics.

    Rows holding NaN in any metric input column are dropped before anything is computed.
    A summary of every metric is printed to stdout. CRPS and the 95% interval score are
    part of that printed summary only; they are not included in the returned dictionary.

    Args:
        df (pd.DataFrame): DataFrame with predictions and uncertainty estimates. Must
            contain the target column, a "prediction" column, and a "prediction_std"
            column (required for CRPS and median_std). Quantile columns ("q_025",
            "q_975", "q_05", "q_95", "q_10", "q_90", "q_25", "q_75") are used for
            coverage/width when "q_025" and "q_975" are present; otherwise Gaussian
            bounds are derived from "prediction_std". Optional "q_16"/"q_84" give the
            68% interval in the quantile case (falling back to "q_10"/"q_90"), and an
            optional "confidence" column adds the confidence/error correlation.
        target_col (str): Name of the true target column in the DataFrame.

    Returns:
        dict: Coverage at 68/80/90/95%, median_std, median interval widths at
            50/68/80/90/95%, interval_to_error_corr, confidence_to_error_corr (None
            without a "confidence" column), and n_samples. An empty dict if no rows
            remain after dropping NaNs.

    Raises:
        ValueError: If the DataFrame is empty, if the target, "prediction", or
            "prediction_std" column is missing, or if "q_025"/"q_975" are present
            without the rest of the quantile columns.
    """
    # Input Validation
    if df.empty:
        raise ValueError("Input DataFrame is empty.")
    if target_col not in df.columns:
        raise ValueError(f"Target column '{target_col}' not found in DataFrame.")
    if "prediction" not in df.columns:
        raise ValueError("Prediction column 'prediction' not found in DataFrame.")

    # Drop rows with NaN in any column the metrics depend on. UQ versions that
    # emit NaN for unscored compounds (no proximity match, etc.) would
    # otherwise poison np.median and scipy.spearmanr, which propagate NaN to
    # the entire scalar metric.
    n_total = len(df)
    candidate_cols = [
        "prediction",
        "prediction_std",
        "confidence",
        target_col,
        "q_025",
        "q_05",
        "q_10",
        "q_16",
        "q_25",
        "q_75",
        "q_84",
        "q_90",
        "q_95",
        "q_975",
    ]
    required_cols = [c for c in candidate_cols if c in df.columns]
    df = df.dropna(subset=required_cols)
    n_valid = len(df)
    if n_valid < n_total:
        log.info(f"UQ metrics: dropped {n_total - n_valid} of {n_total} rows with NaN in metric inputs")
    if n_valid == 0:
        log.warning("UQ metrics: no valid rows after dropping NaNs. Returning empty metrics.")
        return {}

    # median_std and CRPS read "prediction_std" no matter where the interval bounds come
    # from, so quantile columns alone are not enough: fail clearly rather than with a KeyError.
    if "prediction_std" not in df.columns:
        raise ValueError("Prediction std column 'prediction_std' not found in DataFrame.")

    # --- Coverage and Interval Width ---
    if "q_025" in df.columns and "q_975" in df.columns:
        other_quantiles = ("q_05", "q_95", "q_10", "q_90", "q_25", "q_75")
        missing_quantiles = [c for c in other_quantiles if c not in df.columns]
        if missing_quantiles:
            raise ValueError(
                f"Quantile columns {missing_quantiles} not found in DataFrame "
                "(required when 'q_025' and 'q_975' are present)."
            )
        lower_95, upper_95 = df["q_025"], df["q_975"]
        lower_90, upper_90 = df["q_05"], df["q_95"]
        lower_80, upper_80 = df["q_10"], df["q_90"]
        lower_68 = df.get("q_16", df["q_10"])  # fallback to 80% interval
        upper_68 = df.get("q_84", df["q_90"])  # fallback to 80% interval
        lower_50, upper_50 = df["q_25"], df["q_75"]
    else:
        # Gaussian bounds: prediction +/- z * std for each nominal coverage level
        lower_95 = df["prediction"] - 1.96 * df["prediction_std"]
        upper_95 = df["prediction"] + 1.96 * df["prediction_std"]
        lower_90 = df["prediction"] - 1.645 * df["prediction_std"]
        upper_90 = df["prediction"] + 1.645 * df["prediction_std"]
        lower_80 = df["prediction"] - 1.282 * df["prediction_std"]
        upper_80 = df["prediction"] + 1.282 * df["prediction_std"]
        lower_68 = df["prediction"] - 1.0 * df["prediction_std"]
        upper_68 = df["prediction"] + 1.0 * df["prediction_std"]
        lower_50 = df["prediction"] - 0.674 * df["prediction_std"]
        upper_50 = df["prediction"] + 0.674 * df["prediction_std"]
    median_std = df["prediction_std"].median()
    coverage_95 = np.mean((df[target_col] >= lower_95) & (df[target_col] <= upper_95))
    coverage_90 = np.mean((df[target_col] >= lower_90) & (df[target_col] <= upper_90))
    coverage_80 = np.mean((df[target_col] >= lower_80) & (df[target_col] <= upper_80))
    coverage_68 = np.mean((df[target_col] >= lower_68) & (df[target_col] <= upper_68))
    median_width_95 = np.median(upper_95 - lower_95)
    median_width_90 = np.median(upper_90 - lower_90)
    median_width_80 = np.median(upper_80 - lower_80)
    median_width_50 = np.median(upper_50 - lower_50)
    median_width_68 = np.median(upper_68 - lower_68)

    # --- CRPS (measures calibration + sharpness) ---
    # Closed form for a Gaussian predictive distribution N(prediction, prediction_std)
    z = (df[target_col] - df["prediction"]) / df["prediction_std"]
    crps = df["prediction_std"] * (z * (2 * norm.cdf(z) - 1) + 2 * norm.pdf(z) - 1 / np.sqrt(np.pi))
    mean_crps = np.mean(crps)

    # --- Interval Score @ 95% (penalizes miscoverage) ---
    # Width plus a (2 / alpha)-scaled penalty for how far the target falls outside the interval
    alpha_95 = 0.05
    is_95 = (
        (upper_95 - lower_95)
        + (2 / alpha_95) * (lower_95 - df[target_col]) * (df[target_col] < lower_95)
        + (2 / alpha_95) * (df[target_col] - upper_95) * (df[target_col] > upper_95)
    )
    mean_is_95 = np.mean(is_95)

    # --- Interval to Error Correlation ---
    abs_residuals = np.abs(df[target_col] - df["prediction"])
    width_68 = upper_68 - lower_68

    # Spearman correlation for robustness
    interval_to_error_corr = spearmanr(width_68, abs_residuals)[0]

    # --- Confidence to Error Correlation ---
    # If confidence column exists, compute correlation (should be negative: high confidence = low error)
    confidence_to_error_corr = None
    if "confidence" in df.columns:
        confidence_to_error_corr = spearmanr(df["confidence"], abs_residuals)[0]

    # Collect results (CRPS and the interval score are only printed below)
    results = {
        "coverage_68": coverage_68,
        "coverage_80": coverage_80,
        "coverage_90": coverage_90,
        "coverage_95": coverage_95,
        "median_std": median_std,
        "median_width_50": median_width_50,
        "median_width_68": median_width_68,
        "median_width_80": median_width_80,
        "median_width_90": median_width_90,
        "median_width_95": median_width_95,
        "interval_to_error_corr": interval_to_error_corr,
        "confidence_to_error_corr": confidence_to_error_corr,
        "n_samples": len(df),
    }

    print("\n=== UQ Metrics ===")
    print(f"Coverage @ 68%: {coverage_68:.3f} (target: 0.68)")
    print(f"Coverage @ 80%: {coverage_80:.3f} (target: 0.80)")
    print(f"Coverage @ 90%: {coverage_90:.3f} (target: 0.90)")
    print(f"Coverage @ 95%: {coverage_95:.3f} (target: 0.95)")
    print(f"Median Prediction StdDev: {median_std:.3f}")
    print(f"Median 50% Width: {median_width_50:.3f}")
    print(f"Median 68% Width: {median_width_68:.3f}")
    print(f"Median 80% Width: {median_width_80:.3f}")
    print(f"Median 90% Width: {median_width_90:.3f}")
    print(f"Median 95% Width: {median_width_95:.3f}")
    print(f"CRPS: {mean_crps:.3f} (lower is better)")
    print(f"Interval Score 95%: {mean_is_95:.3f} (lower is better)")
    print(f"Interval/Error Corr: {interval_to_error_corr:.3f} (higher is better, target: >0.5)")
    if confidence_to_error_corr is not None:
        print(f"Confidence/Error Corr: {confidence_to_error_corr:.3f} (lower is better, target: <-0.5)")
    print(f"Samples: {len(df)}")
    return results

`uq_model_local(model, version=None, refresh_proximity=False, radius=2, n_bits=4096)`

Load the fitted UQModel (V0, V1, or V2) from this Model's artifact.

Pairs with the existing `fp_prox_model()` / `proximity_model()` factory pattern:

    model = Model("my-model")
    rm = model.uq_model()
    out = rm.predict(test_df[["smiles"]], predictions, prediction_std)

Parameters:

Name	Type	Description	Default
`model`	`Model`	The Workbench Model whose artifact contains a fitted UQModel.	required
`version`	`Optional[str]`	Which UQ version to load — `"v0"` (isotonic on prediction+std), `"v1"` (proximity-augmented RF), or `"v2"` (pure applicability-domain from fingerprint neighbors). If `None`, reads `hyperparameters["uq_version"]` from the bundle and falls back to `"v0"`.	`None`
`refresh_proximity`	`bool`	V1/V2 only. If False (default), use the proximity backend that was embedded in the model artifact at training time — exact reference set used to fit the residual estimator, reproducible, no fingerprint recomputation. If True, build a fresh FingerprintProximity from the current source FeatureSet. Ignored for V0 (no proximity).	`False`
`radius`	`int`	Morgan fingerprint radius (only used for V1/V2 when refresh_proximity=True).	`2`
`n_bits`	`int`	Morgan fingerprint bit width (only used for V1/V2 when refresh_proximity=True).	`4096`

Returns:

Type	Description
`'UQModelV0 \| UQModelV1 \| UQModelV2'`	A ready-to-use UQModelV0, UQModelV1, or UQModelV2 instance.

Raises:

Type	Description
`FileNotFoundError`	If the requested version's artifact is not in the bundle.

Source code in src/workbench/utils/model_utils.py

def uq_model_local(
    model: Model,
    version: Optional[str] = None,
    refresh_proximity: bool = False,
    radius: int = 2,
    n_bits: int = 4096,
) -> "UQModelV0 | UQModelV1 | UQModelV2":  # noqa: F821
    """Load the fitted UQModel (V0, V1, or V2) stored in this Model's artifact.

    Follows the same factory pattern as `fp_prox_model()` / `proximity_model()`:
        model = Model("my-model")
        rm = model.uq_model()
        out = rm.predict(test_df[["smiles"]], predictions, prediction_std)

    The model artifact is downloaded and extracted into a temporary directory, and the
    UQ model class for the resolved version is loaded from that directory.

    Args:
        model: The Workbench Model whose artifact contains a fitted UQModel.
        version: Which UQ version to load — ``"v0"`` (isotonic on prediction+std),
            ``"v1"`` (proximity-augmented RF), or ``"v2"`` (pure applicability-domain
            from fingerprint neighbors). If ``None``, reads
            ``hyperparameters["uq_version"]`` from the bundle and falls back
            to ``"v0"``.
        refresh_proximity: V1/V2 only. If False (default), use the proximity backend
            that was embedded in the model artifact at training time — exact
            reference set used to fit the residual estimator, reproducible, no
            fingerprint recomputation. If True, build a fresh FingerprintProximity
            from the current source FeatureSet. Ignored for V0 (no proximity).
        radius: Morgan fingerprint radius (only used for V1/V2 when refresh_proximity=True).
        n_bits: Morgan fingerprint bit width (only used for V1/V2 when refresh_proximity=True).

    Returns:
        A ready-to-use UQModelV0, UQModelV1, or UQModelV2 instance.

    Raises:
        ValueError: If the Model has no artifact, or the resolved version is not a valid one.
        FileNotFoundError: If the requested version's artifact is not in the bundle.
    """
    from workbench.algorithms.dataframe.uq_model_v0 import UQModelV0  # noqa: F401
    from workbench.algorithms.dataframe.uq_model_v1 import UQModelV1  # noqa: F401
    from workbench.algorithms.dataframe.uq_model_v2 import UQModelV2  # noqa: F401

    artifact_uri = model.model_data_url()
    if artifact_uri is None:
        raise ValueError(f"No model artifact found for {model.name}")

    uq_version = _resolve_uq_version(model, version)
    if uq_version not in _VALID_UQ_VERSIONS:
        raise ValueError(f"Unknown UQ version '{uq_version}' (expected one of {_VALID_UQ_VERSIONS})")

    # Only V1/V2 take a proximity backend; build a replacement just when asked to
    proximity_override = None
    if refresh_proximity and uq_version in ("v1", "v2"):
        from workbench.utils.prox_utils import fingerprint_prox_model_local

        proximity_override = fingerprint_prox_model_local(model, radius=radius, n_bits=n_bits)

    with tempfile.TemporaryDirectory() as workdir:
        tarball = os.path.join(workdir, "model.tar.gz")
        wr.s3.download(path=artifact_uri, local_file=tarball)
        safe_extract_tarfile(tarball, workdir)

        # V0 is loaded directly, with no marker-file check and no proximity backend
        if uq_version == "v0":
            return UQModelV0.load(workdir)

        # V1 and V2 differ only in loader class and in the file that proves they were fitted
        if uq_version == "v1":
            loader, marker_file, label = UQModelV1, "uq_model.joblib", "UQModelV1"
        else:
            loader, marker_file, label = UQModelV2, UQModelV2.METADATA_FILENAME, "UQModelV2"

        if not os.path.exists(os.path.join(workdir, marker_file)):
            raise FileNotFoundError(
                f"Model '{model.name}' does not have a fitted {label} "
                f"(expected {marker_file} in the model artifact)."
            )
        return loader.load(workdir, prox=proximity_override)

Examples

Feature Importance

"""Example for using some Model Utilities"""
# Model is used below, so it has to be imported alongside the utility function
from workbench.api import Model
from workbench.utils.model_utils import feature_importance

# Construct the Model by name and pass it to feature_importance
model = Model("aqsol_classification")
feature_importance(model)

Output

[('mollogp', 469.0),
 ('minabsestateindex', 277.0),
 ('peoe_vsa8', 237.0),
 ('qed', 237.0),
 ('fpdensitymorgan1', 230.0),
 ('fpdensitymorgan3', 221.0),
 ('estate_vsa4', 220.0),
 ('bcut2d_logphi', 218.0),
 ('vsa_estate5', 218.0),
 ('vsa_estate4', 209.0),
 ...]

Additional Resources

Workbench API Classes: API Classes
Consulting Available: SuperCowPowers LLC