Source code for biom3d.preprocess

"""
Dataset preparation to speed up training.

Steps:

- Normalization
- Expand dims and one_hot encoding
- Saving to numpy or tif file 

"""
from sys import platform
import sys
from typing import Any, Iterable, Literal, Optional 
import numpy as np
import os 
from tqdm import tqdm
import argparse
import pandas as pd

from biom3d.auto_config import auto_config, data_fingerprint
from biom3d.utils import one_hot_fast, resize_3d, save_python_config,DataHandlerFactory

#---------------------------------------------------------------------------
# Define the CSV file for KFold split


[docs]
def hold_out(df:pd.DataFrame, ratio:float=0.1, seed:int=42)->pd.DataFrame:
    """
    Flag a random fraction of the rows of a DataFrame as held out.

    A binary column `'hold_out'` is written into `df` (the DataFrame is modified in place and
    also returned). `int(len(df) * ratio)` randomly chosen rows receive `1`, every other row
    receives `0`.

    Parameters
    ----------
    df : pandas.DataFrame
        Input DataFrame with at least one column. Only the length of the first column is used.
    ratio : float, default=0.1
        Proportion of rows to mark as held out.
    seed : int, default=42
        Seed of the random generator, for reproducibility.

    Returns
    -------
    df : pandas.DataFrame
        The same DataFrame, with the `'hold_out'` column added.
    """
    n_rows = len(np.array(df.iloc[:,0]))
    n_held = int(n_rows*ratio)

    # rank[j] is the position of row j inside a random ordering of all the rows
    rank = np.argsort(np.random.default_rng(seed).permutation(n_rows))

    # the rows that land in the first `n_held` positions are the held-out ones
    df['hold_out'] = (rank < n_held).astype(int)
    return df



[docs]
def strat_kfold(df:pd.DataFrame, k:int=4, seed:int=43)->pd.DataFrame:
    """
    Assign each row of the DataFrame to one of `k` stratified folds.

    Folds are drawn separately for the hold-out rows and for the other rows, so that both
    groups are spread as evenly as possible over the folds. Requires a `'hold_out'` column,
    e.g. one previously added with `hold_out()`. The DataFrame is modified in place and
    also returned.

    Parameters
    ----------
    df : pandas.DataFrame
        Input DataFrame with a `'hold_out'` column (0 or 1).
    k : int, default=4
        Number of folds. Must be at least 1.
    seed : int, default=43
        Random seed for reproducibility.

    Raises
    ------
    ValueError
        If `k` is smaller than 1.
    KeyError
        If `df` has no `'hold_out'` column.

    Returns
    -------
    df : pandas.DataFrame
        DataFrame with an added integer `'fold'` column containing fold assignments (0 to k-1).
    """
    if k < 1:
        raise ValueError(f"k must be a positive integer, but got {k}.")

    rng = np.random.default_rng(seed)
    holds_out = np.array(df['hold_out'])

    def split_indices(n_items):
        """Return a shuffled integer array of `n_items` fold ids, balanced over the k folds."""
        fold_size = n_items//k
        folds = [fold for fold in range(k) for _ in range(fold_size)]
        # the items that do not fit in k equal folds are assigned to random folds
        for _ in range(n_items - len(folds)):
            folds.append(int(rng.integers(0, k, dtype=int)))
        # explicit dtype: an empty group must still give an integer array
        folds = np.array(folds, dtype=int)
        rng.shuffle(folds)
        return folds

    # the non hold-out rows are drawn first, then the hold-out rows (keeps the random stream stable)
    folds_train = split_indices(int(np.count_nonzero(holds_out==0)))
    folds_test = split_indices(int(np.count_nonzero(holds_out==1)))

    # merge folds at the right place; the buffer is explicitly an integer array so that
    # the 'fold' column does not inherit the dtype of the first (filename) column
    merge = np.zeros(len(holds_out), dtype=int)
    merge[holds_out==1] = folds_test
    merge[holds_out==0] = folds_train

    # add the column to the DataFrame
    df['fold'] = merge
    return df



[docs]
def generate_kfold_csv(filenames:list[str], 
                       csv_path:str, 
                       hold_out_rate:float=0., 
                       kfold:int=5, 
                       seed:int=42
                       )->None:
    """
    Write a CSV file describing the hold-out / cross-validation split of a list of images.

    The CSV has one row per filename and three columns:

    - `'filename'`: image filename,
    - `'hold_out'`: 1 for test/hold-out set, 0 otherwise,
    - `'fold'`: fold index (0 to kfold - 1).

    Parameters
    ----------
    filenames : list of str
        List of image filenames, relative to a dataset root.
    csv_path : str
        Path to the output CSV file.
    hold_out_rate : float, default=0.0
        Proportion of samples to assign to the hold-out (test) set.
    kfold : int, default=5
        Number of folds for stratified k-fold cross-validation.
    seed : int, default=42
        Random seed, shared by the hold-out draw and the fold draw.

    Returns
    -------
    None
    """
    table = pd.DataFrame(filenames, columns=['filename'])
    # first flag the hold-out rows, then spread both groups over the folds
    table = strat_kfold(
        hold_out(table, ratio=hold_out_rate, seed=seed),
        k=kfold,
        seed=seed,
    )
    table.to_csv(csv_path, index=False)


#---------------------------------------------------------------------------
# 3D segmentation preprocessing

[docs]
def resize_img_msk(img:np.ndarray, 
                   output_shape:tuple[int]|list[int]|np.ndarray, 
                   msk:Optional[np.ndarray]=None,
                   )->np.ndarray | tuple[np.ndarray,np.ndarray]:
    """
    Resize an image and, when given, its mask to a common output shape.

    The image is resized with `resize_3d(..., order=3)`; the mask is resized with
    `resize_3d(..., is_msk=True, order=1)`.

    Parameters
    ----------
    img : numpy.ndarray
        Input image array to resize.
    output_shape : tuple, list or numpy.ndarray of int
        Desired output shape (Dx, Dy, Dz).
    msk : numpy.ndarray, optional
        Corresponding mask to resize.

    Returns
    -------
    new_img: numpy.ndarray
        The resized image.
    new_msk: numpy.ndarray, optional
        The resized mask, only returned if `msk` is provided.
    """
    resized_img = resize_3d(img, output_shape, order=3)
    if msk is None:
        return resized_img
    return resized_img, resize_3d(msk, output_shape, is_msk=True, order=1)



[docs]
def get_resample_shape(input_shape:tuple[int]|list[int]|np.ndarray, 
                       spacing:list[float], 
                       median_spacing:list[float]
                       )->np.ndarray:
    """
    Compute the new shape of a volume after resampling based on spacing information.

    Parameters
    ----------
    input_shape : tuple, list or numpy.ndarray of int
        Shape of the input volume. Can be (C, D, H, W) or (D, H, W).
    spacing : list of float
        Original voxel spacing for each axis.
    median_spacing : list of float
        Target voxel spacing for each axis.

    Returns
    -------
    numpy.ndarray
        New shape after resampling, as integers (Dx, Dy, Dz).
    """
    input_shape = np.array(input_shape)
    spacing = np.array(spacing)
    median_spacing = np.array(median_spacing)
    if len(input_shape)==4:
        input_shape=input_shape[1:]
    return np.round(((spacing/median_spacing)[::-1]*input_shape)).astype(int)



[docs]
def sanity_check(msk:np.ndarray, num_classes:Optional[int]=None)->np.ndarray:
    """
    Check that a segmentation mask holds valid class labels, fixing common issues.

    A 3D mask is valid when its unique values are exactly `0 .. num_classes-1`. Otherwise a
    warning is printed and, depending on the situation, the mask is binarized, kept as is,
    relabelled, or rejected. A 4D mask with a single channel is checked as a 3D mask; a 4D mask
    with several channels is checked channel by channel, each channel being treated as binary.

    Parameters
    ----------
    msk : numpy.ndarray
        Segmentation mask. Can be 3D or 4D (if one-hot encoded).
    num_classes : int, optional
        Expected number of classes. If not provided, the number of unique values of `msk`.

    Raises
    ------
    RuntimeError
        If automatic correction is not possible due to ambiguous label values.
    AssertionError
        If `num_classes` is invalid (not an int or < 2).

    Returns
    -------
    numpy.ndarray
        Validated and possibly corrected segmentation mask.
    """
    found = np.sort(np.unique(msk))
    if num_classes is None:
        num_classes = len(found)

    assert isinstance(num_classes,int)
    assert num_classes >= 2

    if msk.ndim == 4:
        if msk.shape[0] == 1:
            # single channel: check it as a plain label mask
            return sanity_check(msk[0], num_classes=num_classes)
        # several channels: each channel is considered to be a binary mask
        return np.array([sanity_check(channel, num_classes=2) for channel in msk])

    expected = np.arange(num_classes)
    if np.array_equal(found, expected):
        # nothing to fix
        return msk

    # from here on the annotations are abnormal: fix them when possible, fail otherwise
    print("[Warning] There is something abnormal with the annotations. Each voxel value must be in range {} but is in range {}.".format(expected, found))

    if num_classes == 2:
        # binarize: the most frequent value becomes 0, everything else becomes 1
        # for instance: unique [2,127,232] becomes [0,1], 0 being 2 and 1 being 127 and 232
        values, counts = np.unique(msk, return_counts=True)
        background = values[np.argmax(counts)]
        print("[Warning] All values equal to the most frequent value ({}) will be set to zero.".format(background))
        return (msk != background).astype(np.uint8)

    if np.isin(found, expected).all():
        # only valid labels, but some of them are absent from this mask
        print("[Warning] One or more labels are missing.")
        return msk

    if len(found) != num_classes:
        # case like [2,18,128,254] where the number of classes should be 3 are impossible to decide...
        raise RuntimeError("[Error] There is an error in the labels that could not be solved automatically.")

    # right number of labels but wrong values: relabel by rank
    # for instance: unique [2,127,232] becomes [0,1,2]
    print("[Warning] Annotation are wrong in the mask, we will re-annotate the mask.")
    relabelled = np.zeros(msk.shape, dtype=msk.dtype)
    for new_label, old_label in enumerate(found):
        relabelled[msk == old_label] = new_label
    return relabelled



[docs]
def correct_mask(
    mask:np.ndarray,
    num_classes:int, # if num_classes is defined, then softmax
    is_2d:bool=False,
    standardize_dims:bool=True,
    output_dtype:np.dtype=np.uint16,
    use_one_hot:bool=False,
    remove_bg:bool=False,
    encoding_type:Literal['auto', 'label', 'binary', 'onehot']='auto',
    auto_correct:bool=True,
    binary_correction_strategy:Literal['majority_is_bg']='majority_is_bg'
)->np.ndarray:
    """
    Perform a sanity check and automatic correction on a segmentation mask.

    This function ensures consistency and correctness of segmentation masks, handling
    binary, label, or one-hot encodings. It can also automatically correct common labeling issues.

    This function is designed to be highly automated to reduce user friction. It makes
    assumptions about the data and prints warnings about any corrections it performs.
    Expert users can override the automatic behavior. The input mask is never modified,
    the function works on a copy.

    Parameters
    ----------
    mask : numpy.ndarray
        The input segmentation mask.

        - Shape for 3D: (D, H, W) for label masks, or (C, D, H, W) for binary/one-hot masks.
        - Shape for 2D (if `is_2d=True`): (H, W) or (C, H, W).
    num_classes : int
        Number of target classes. Must be >= 2.
    is_2d : bool, default=False
        Whether the input is 2D (vs 3D). If True, expects (H, W) for label masks or (C, H, W)
        for binary/one-hot masks; a singleton depth axis is inserted so that the mask is
        processed as (C, 1, H, W).
    standardize_dims : bool, default=True
        If True, ensures output is 4D. If False (and `use_one_hot` is False), singleton axes
        are squeezed until the input dimensionality is restored.
    output_dtype : np.dtype, default=np.uint16
        Desired data type for the output mask.
    use_one_hot : bool, default=False
        If True and the mask is a label mask, converts it to one-hot encoding.
    remove_bg : bool, default=False
        If `use_one_hot=True`, removes the background channel (assumed to be index 0).
    encoding_type : {'auto', 'label', 'binary', 'onehot'}, default='auto'
        - 'auto': determine the type from the mask dimensions. A mask without channel axis, or
          with a single channel, is assumed 'label'; a multi-channel mask is assumed 'binary'.
        - 'label': A single-channel mask where pixel values are class indices (0, 1, 2...).
          A leading singleton channel axis is accepted and removed.
        - 'binary': A multi-channel mask where each channel is an independent binary (0/1)
          segmentation. Used with sigmoid activations.
        - 'onehot': A multi-channel mask where channels are mutually exclusive. Used with
          softmax activations.
    auto_correct : bool, default=True
        Whether to attempt automatic correction of invalid masks.
    binary_correction_strategy : {'majority_is_bg'}, default='majority_is_bg'
        Heuristic to fix binary masks with unexpected values.

        - 'majority_is_bg': Treat the most common value as background (0), others as foreground (1).

    Raises
    ------
    RuntimeError
        If `num_classes` is invalid (not an int or < 2), if the mask shape is incompatible with
        the requested 2D/3D mode or encoding, or if mask validation fails and cannot be corrected.

    Returns
    -------
    numpy.ndarray
        Corrected and standardized segmentation mask.
    """
    if not isinstance(num_classes, int) or num_classes < 2:
        raise RuntimeError(f"num_classes must be an integer >= 2, but got {num_classes}.")

    # --- 0. Pre-process for 2D data ---
    original_ndim = mask.ndim 
    processed_mask = mask.copy()
    if is_2d: 
        if processed_mask.ndim == 2: # (H,W) -> (1,1,H,W)
            processed_mask = processed_mask[np.newaxis, np.newaxis, ...]
        elif processed_mask.ndim == 3: # (C,H,W) -> (C,1,H,W)
            processed_mask = processed_mask[:, np.newaxis, ...]
        else:
            raise RuntimeError(f"For is_2d=True, expected mask.ndim to be 2 or 3, but got {mask.ndim}.")

    # --- 1. Determine Encoding Type (if 'auto') ---
    if encoding_type == 'auto':
        if processed_mask.ndim == 3:
            encoding_type = 'label'
        elif processed_mask.ndim == 4:
            # A single channel is a label map; several channels are usually independent binary masks
            encoding_type = 'label' if processed_mask.shape[0] == 1 else 'binary'
        else:
            raise RuntimeError(f"Unsupported mask dimension: {processed_mask.ndim}. Shape: {processed_mask.shape}")

    # --- 2. Process based on Encoding Type ---
    # --- Case A: Label Mask (e.g., [0, 1, 2, ...]) ---
    if encoding_type == 'label':
        # Drop a leading singleton channel: (1,D,H,W) -> (D,H,W). This is needed for every 2D label
        # mask (expanded to (1,1,H,W) above), whether the encoding was auto-detected or given.
        if processed_mask.ndim == 4 and processed_mask.shape[0] == 1:
            processed_mask = processed_mask[0]
        if processed_mask.ndim != 3:
            raise RuntimeError(f"A 'label' mask must be 3D, but got shape {processed_mask.shape}")
        
        uni = np.unique(processed_mask)
        expected_labels = np.arange(num_classes)

        # The labels must be a subset of what is expected (missing labels are tolerated)
        if not np.all(np.isin(uni, expected_labels)):
            # --- Correction Logic for Label Masks ---
            print(f"[WARNING] Invalid labels found in mask. Expected subset of {expected_labels}, but found {uni}.")
            if not auto_correct:
                raise RuntimeError("Mask is invalid and auto_correct is False.")

            # Heuristic 1: Right number of classes, but wrong values (e.g., [10, 20, 30] for num_classes=3)
            if len(uni) == num_classes:
                print(f"[WARNING] Remapping labels: {uni} -> {expected_labels}")
                # the rank of each value among the sorted unique values is its new label
                _, inv = np.unique(processed_mask, return_inverse=True)
                processed_mask = inv.reshape(processed_mask.shape)

            # Heuristic 2: Binary case with wrong labels (e.g., [-1, 10, 255])
            elif num_classes == 2:
                print("[INFO] Attempting binary correction for label mask.")
                if binary_correction_strategy != 'majority_is_bg':
                    raise RuntimeError(f"Unknown binary_correction_strategy: {binary_correction_strategy}")
                processed_mask, thr = _majority_is_background(processed_mask)
                print(f"[WARNING] Heuristic 'majority_is_bg': Setting most frequent value ({thr}) to 0, others to 1.")

            else:
                print("[ERROR] Cannot solve ambiguity. The number of unique labels "
                    f"({len(uni)}) does not match num_classes ({num_classes}).")
                raise RuntimeError("Unrecoverable error in mask labels.")

        # After processing, give the label mask its channel dimension
        if use_one_hot:
            processed_mask = one_hot_fast(processed_mask, num_classes, mapping_mode='remap')
            if remove_bg: processed_mask = processed_mask[1:]
        else:
            processed_mask = processed_mask[np.newaxis, ...] # (D,H,W) -> (1,D,H,W) or (1,H,W) to (1,1,H,W)

    # --- Case B: Binary Mask (for Sigmoid) ---
    elif encoding_type == 'binary':
        if processed_mask.ndim != 4:
            raise RuntimeError(f"A 'binary' mask must be 4D (C,D,H,W), but got shape {processed_mask.shape}")
        
        is_perfect = True
        for i, channel in enumerate(processed_mask):
            uni = np.unique(channel)
            # A channel is valid if it only contains 0 and/or 1.
            if np.all(np.isin(uni, [0, 1])):
                continue

            is_perfect = False
            print(f"[WARNING] Channel {i} is not binary. Found values: {uni}.")
            if not auto_correct:
                raise RuntimeError(f"Channel {i} is invalid and auto_correct is False.")

            # Apply the same binary correction heuristic per-channel
            print(f"[INFO] Applying correction to channel {i}.")
            if binary_correction_strategy != 'majority_is_bg':
                raise RuntimeError(f"Unknown binary_correction_strategy: {binary_correction_strategy}")
            foreground, thr = _majority_is_background(channel)
            print(f"[WARNING] Channel {i}: Setting most frequent value ({thr}) to 0, others to 1.")
            processed_mask[i] = foreground
        
        if is_perfect: print("[INFO] All binary channels are valid.")

    # --- Case C: One-Hot Mask (for Softmax) ---
    elif encoding_type == 'onehot':
        if processed_mask.ndim != 4:
            raise RuntimeError(f"A 'onehot' mask must be 4D (C,D,H,W), but got shape {processed_mask.shape}")
        if processed_mask.shape[0] != num_classes:
            raise RuntimeError(f"One-hot mask has {processed_mask.shape[0]} channels, but num_classes is {num_classes}.")
        
        # A one-hot mask must sum to 1 along the channel axis and contain only 0s and 1s
        is_binary = np.all((processed_mask == 0) | (processed_mask == 1))
        sums_are_one = np.all(np.sum(processed_mask, axis=0) == 1)

        if not (is_binary and sums_are_one):
            # Correction for broken one-hot masks is extremely ambiguous. Best to fail.
            print("[ERROR] Mask failed one-hot validation. is_binary:", is_binary, "sums_are_one:", sums_are_one)
            raise RuntimeError("Invalid one-hot mask. Correction is not supported.")
            
    else:
        raise RuntimeError(f"Invalid encoding_type specified: {encoding_type}")

    # --- 3. Post-process to restore original dimensionality --- 
    if  not standardize_dims and not use_one_hot:
        print("[INFO] Restoring original dimensions.")
        # Squeeze back down to original ndim
        while processed_mask.ndim > original_ndim:
            # Squeeze the first axis that has size 1
            squeezable_axes = [i for i, s in enumerate(processed_mask.shape) if s == 1]
            if not squeezable_axes: break
            processed_mask = np.squeeze(processed_mask, axis=squeezable_axes[0])

    return processed_mask.astype(output_dtype)


def _majority_is_background(arr:np.ndarray)->tuple[np.ndarray, Any]:
    """Return (`arr != most frequent value`, most frequent value); works with negative and float values."""
    # np.unique is used instead of np.bincount, which only accepts non-negative integers
    values, counts = np.unique(arr, return_counts=True)
    background = values[np.argmax(counts)]
    return arr != background, background



[docs]
def standardize_img_dims(img:np.ndarray, num_channels:int, channel_axis:int, is_2d:bool)->tuple[np.ndarray, tuple[int, ...]]:
    """
    Standardizes an image to 4D format: (C, D, H, W) for 3D, or (C, 1, H, W) for 2D.

    This function ensures compatibility with the rest of the pipeline. The channel axis is moved
    to the front while the order of the spatial axes is preserved. If the axis expected to hold
    the channels does not have `num_channels` elements but exactly one axis of the image does,
    that axis is used instead and a warning is printed.
    E.g: (8,32,32,1) with channel_axis=0 and num_channels = 1 -> (1,8,32,32)

    Parameters
    ----------
    img : numpy.ndarray
        Input image array. Expected shape:
            - 2D image: (H, W) or (C, H, W)
            - 3D image: (D, H, W) or (C, D, H, W)
    num_channels : int
        Expected number of channels after formatting.
    channel_axis : int
        Axis where the channel is located in the input image (before standardization).
        Only used if `img` has 4 dimensions.
    is_2d : bool
        Whether the input is 2D (vs 3D).

    Raises
    ------
    ValueError
        If the input shape is incompatible with 2/3D, if `channel_axis` is out of bounds,
        or if the number of channels does not match.

    Returns
    -------
    img : numpy.ndarray
        Standardized image with shape:
            - 2D mode: (C, 1, H, W)
            - 3D mode: (C, D, H, W)
    original_shape : tuple
        Original shape of the input image.
    """
    original_shape = img.shape

    # Axis expected to hold the channels. It is 0 unless a 4D volume declares another one.
    declared_axis = 0

    if is_2d:
        # The singleton depth axis is only inserted at the very end, so that looking for
        # the channel axis cannot displace it.
        if img.ndim == 2: # (H,W) -> (1,H,W)
            img = img[np.newaxis, ...]
        elif img.ndim != 3:
            raise ValueError(f"For 2D, expected 2 or 3 dims, but got {img.ndim}")
    elif img.ndim == 3: # (D,H,W) -> (1,D,H,W)
        img = img[np.newaxis, ...]
    elif img.ndim == 4: # (C,D,H,W) or other order
        if not -img.ndim <= channel_axis < img.ndim:
            raise ValueError(f"channel_axis {channel_axis} is out of bounds for an image with {img.ndim} dims")
        declared_axis = channel_axis
    else:
        raise ValueError(f"For 3D, expected 3 or 4 dims, but got {img.ndim}")

    source_axis = declared_axis
    if img.shape[declared_axis] != num_channels:
        if img.shape.count(num_channels) != 1:
            raise ValueError(f"Image has {img.shape[declared_axis]} channels but expected {num_channels}.")
        # Heuristic to save the day in case of incorrect channel axis
        print("[WARNING] The channels where not found at channel axis, but we found a dimension with same size and moved it at first dimension.\n" \
        f"Image shape : '{img.shape}'")
        source_axis = img.shape.index(num_channels)

    # moveaxis (and not swapaxes) keeps the remaining axes in their original order:
    # (D,H,W,C) -> (C,D,H,W)
    img = np.moveaxis(img, source_axis, 0)

    if is_2d: # (C,H,W) -> (C,1,H,W)
        img = img[:, np.newaxis, ...]

    return img, original_shape



[docs]
def seg_preprocessor(
    img:np.ndarray, 
    img_meta:dict[str,Any],
    num_classes:int,
    msk:np.ndarray=None,
    use_one_hot:bool = False,
    remove_bg:bool = False, 
    median_spacing:list[float]|np.ndarray=[],
    clipping_bounds:list[float]|tuple[float,float]=[],
    intensity_moments:list[float]|tuple[float,float]=[],
    channel_axis:int=0,
    num_channels:int=1,
    seed:int = 42,
    is_2d:bool=False,
    )->tuple[np.ndarray,np.ndarray,dict[int,list[int]]]|tuple[np.ndarray,dict[str,Any]]:
    """
    Run the whole preprocessing pipeline on one image and, optionally, its mask.

    The steps are applied in this order:

    1. The image is standardized to 4D with `standardize_img_dims`.
    2. The mask, if any, is validated, corrected and optionally one-hot encoded with `correct_mask`.
    3. Image intensities are clipped (optional) then normalized.
    4. Image and mask are resampled to the target spacing (optional).
    5. The image is cast to `float32`.
    6. Foreground voxel coordinates are sampled for each class (only when a mask is given).

    Parameters
    ----------
    img : numpy.ndarray
        The input image array. Can be 2D or 3D, with or without channel dimension.
    img_meta : dict of str to any
        Image metadata. The `'spacing'` entry, if present, is used for resampling.
    num_classes : int
        Number of segmentation classes. Used when `msk` is provided.
    msk : numpy.ndarray, optional
        Segmentation mask corresponding to the image. Can be 2D or 3D.
    use_one_hot : bool, default=False
        If True, the mask will be converted to one-hot encoding.
    remove_bg : bool, default=False
        If True and `use_one_hot` is True, the background channel (0) is removed.
    median_spacing : list or numpy.ndarray of float, optional
        Target spacing for resampling. Resampling only happens when both `median_spacing` and
        the `'spacing'` metadata are non-empty lists, tuples or arrays.
    clipping_bounds : list or tuple of float, optional
        (min, max) used to clip intensity values. Clipping only happens when it has 2 elements.
    intensity_moments : list or tuple of float, optional
        (mean, std) for intensity normalization. If empty or None, the mean and the standard
        deviation of the (clipped) image are used.
    channel_axis : int, default=0
        Index of the channel axis in the input image.
    num_channels : int, default=1
        Expected number of image channels after standardization.
    seed : int, default=42
        Random seed for reproducibility in foreground sampling.
    is_2d : bool, default=False
        If True, assumes the image and mask are 2D rather than 3D.

    Raises
    ------
    RuntimeError
        If the mask format is invalid and cannot be corrected.
    ValueError
        If input dimensions are inconsistent with expected format.

    Returns
    -------
    If `msk` is provided, returns `(img, msk, fg)`:
        - `img`: numpy.ndarray
            Preprocessed image.
        - `msk`: numpy.ndarray
            Preprocessed segmentation mask.
        - `fg`: dict mapping class index -> array of sampled voxel coordinates
          (an empty list for a class without any voxel).
    If `msk` is None, returns `(img, img_meta)`:
        - `img`: numpy.ndarray
            Preprocessed image.
        - `img_meta`:
            The input metadata dictionary, to which `original_shape` has been added.

    Notes
    -----
    - Foreground sampling is capped at 10,000 voxels per class.
    - Designed for use in biology and medical image segmentation pipelines.
    """
    def _is_filled(values)->bool:
        # True for a non-empty list, tuple or array
        return (values is not None
                and isinstance(values, (list, tuple, np.ndarray))
                and np.asarray(values).size > 0)

    has_mask = msk is not None
    spacing = img_meta.get('spacing', None)

    # --- Dimensions: 4D image, validated 4D mask ---
    img, original_shape = standardize_img_dims(img, num_channels, channel_axis, is_2d)
    if has_mask:
        msk = correct_mask(
            msk,
            num_classes,
            is_2d=is_2d,
            use_one_hot=use_one_hot,
            remove_bg=remove_bg,
            output_dtype=np.uint16,
            auto_correct=True,
            )

    assert img.ndim == 4
    assert not has_mask or msk.ndim == 4

    # --- Intensities: optional clipping, then z-score ---
    if clipping_bounds is not None and len(clipping_bounds) == 2:
        lower, upper = clipping_bounds
        img = np.clip(img, lower, upper)

    if intensity_moments is not None and len(intensity_moments) > 0:
        mean, std = intensity_moments
    else:
        # no dataset statistics: fall back to the statistics of this image
        mean, std = img.mean(), img.std()
    img = (img - mean) / (std + 1e-8) # epsilon guards against a null std

    # --- Resampling to the target spacing ---
    if _is_filled(median_spacing) and _is_filled(spacing):
        output_shape = get_resample_shape(img.shape, spacing, median_spacing)
        if has_mask:
            img, msk = resize_img_msk(img, msk=msk, output_shape=output_shape)
        else:
            img = resize_3d(img, output_shape)

    img = img.astype(np.float32)

    if not has_mask:
        img_meta["original_shape"] = original_shape
        return img, img_meta

    # --- Foreground coordinates, used later for patch sampling ---
    rng = np.random.default_rng(seed)
    if use_one_hot:
        # one channel per class; the first channel is class 1 when the background was removed
        first_class = 1 if remove_bg else 0
        targets = [(first_class + channel, channel, 1) for channel in range(msk.shape[0])]
    else:
        # label mask: every foreground class (1 and up) is looked up in the first channel
        targets = [(label, 0, label) for label in range(1, num_classes)]

    fg = {}
    for class_idx, channel, value in targets:
        coords = np.argwhere(msk[channel] == value)
        if len(coords) == 0:
            fg[class_idx] = []
            continue
        # keep at most 10000 randomly chosen voxels per class
        picked = rng.choice(len(coords), size=min(len(coords), 10000), replace=False)
        fg[class_idx] = coords[picked, :]

    if all(len(found) == 0 for found in fg.values()):
        print("[Warning] Empty foreground found for all classes!")

    return img, msk, fg


#---------------------------------------------------------------------------
# 3D segmentation preprocessing
# Nifti conversion (Medical Segmentation Decathlon)
# normalization: z-score
# resampling
# intensity normalization
# one_hot encoding

[docs]
class Preprocessing:
    """
    Preprocessing pipeline for 2D or 3D medical segmentation datasets.

    Handles preprocessing of medical images and masks including:

    - File conversion (e.g., NIfTI to NumPy or TIFF)
    - Z-score normalization and intensity clipping
    - Resampling to median voxel spacing
    - One-hot encoding of labels
    - Optional background removal
    - Optional splitting of single image datasets
    - K-Fold CSV generation

    Usage:
    Instantiate this class with all required parameters, then call `run()` to start preprocessing.

    :ivar str img_path: Path to the collection containing input images.
    :ivar str msk_path: Path to the collection containing input masks. (can be None).
    :ivar DataHandler handler: DataHandler used to load and save images.
    :ivar str img_outpath: Output path for processed images.
    :ivar str msk_outpath: Output path for processed masks.
    :ivar str fg_outpath: Output path for foreground masks (used in training).
    :ivar int num_classes: Number of classes in the segmentation masks.
    :ivar bool use_one_hot: Whether to one-hot encode the labels.
    :ivar bool remove_bg: Whether to remove the background class in the label.
    :ivar list median_size: Median shape of the dataset (used to detect channel axis).
    :ivar list median_spacing: Median voxel spacing of the dataset.
    :ivar list clipping_bounds: Intensity clipping bounds [p0.5, p99.5] for normalization.
    :ivar list intensity_moments: Mean and std intensity values for normalization.
    :ivar bool use_tif: If True, save outputs as `.tif` instead of `.npy`.
    :ivar float split_rate_for_single_img: Portion used to split a single image into train/val.
    :ivar int num_kfolds: Number of folds to use for cross-validation.
    :ivar bool is_2d: Whether the input data is 2D instead of 3D.
    :ivar int num_channels: Number of channels in the images (inferred from median size).
    :ivar int channel_axis: Axis corresponding to channel dimension.
    :ivar int img_len: Total number of images (ie: Size of the dataset).
    :ivar str csv_path: Path to the CSV file used for K-Fold or holdout splitting.
    """


[docs]
    def __init__(
        self,
        img_path:str,
        img_outpath:Optional[str] = None,
        msk_path:Optional[str] = None, # if None, only images are preprocesses not the masks
        msk_outpath:Optional[str] = None,
        fg_outpath:Optional[str] = None, # foreground location, eventually used by the dataloader
        num_classes:Optional[int] = None, # just for debug when empty masks are provided
        use_one_hot:bool = False,
        remove_bg:bool = False, # keep the background in labels 
        median_size:Iterable[int] = [],
        median_spacing:list[float]=[],
        clipping_bounds:list[float]=[],
        intensity_moments:list[float]=[],
        use_tif:bool=False, # use tif instead of npy 
        split_rate_for_single_img:float=0.25,
        num_kfolds:int=5,
        is_2d:bool=False,
        ):
        """
        Store the preprocessing settings and open the data handler.

        Besides copying the arguments onto the instance, the constructor:

        - builds the data handler from the input/output locations and reads
          the effective output locations back from it;
        - places the fold CSV (``folds.csv``) in ``os.path.dirname(img_path)``;
        - infers the channel count and channel axis from ``median_size``;
        - lowers ``num_kfolds`` when the dataset holds fewer than twice as
          many images as folds.

        Parameters
        ----------
        img_path : str
            Path to the collection containing input images.
        img_outpath : str, optional
            Path to the collection to save the preprocessed images.
        msk_path : str, optional
            Path to the collection containing input masks.
        msk_outpath : str, optional
            Path to the collection to save the preprocessed masks.
        fg_outpath : str, optional
            Path to the collection to save the foreground mask.
        num_classes : int, optional
            Number of classes in the masks (including background).
        use_one_hot : bool, default=False
            Whether to one-hot encode the mask labels.
        remove_bg : bool, default=False
            Whether to remove the background class in the masks.
        median_size : list of int, optional
            Median shape of the dataset (used to infer channel axis).
        median_spacing : list of float, optional
            Median voxel spacing of the dataset.
        clipping_bounds : list of float, optional
            Intensity clipping bounds [p0.5, p99.5] for normalization.
        intensity_moments : list of float, optional
            Mean and std intensity values for normalization.
        use_tif : bool, default=False
            If True, save preprocessed outputs as TIFF instead of NumPy.
        split_rate_for_single_img : float, default=0.25
            Split ratio for single image dataset (used for train/val split).
        num_kfolds : int, default=5
            Number of folds to generate for K-Fold validation.
        is_2d : bool, default=False
            Whether the dataset is 2D (True) or 3D (False).
        """
        # --- input locations and data handler ---------------------------------
        self.img_path = img_path
        self.msk_path = msk_path
        self.handler = DataHandlerFactory.get(
            self.img_path,
            preprocess=True,
            output=img_outpath,
            msk_path=self.msk_path,
            img_outpath=img_outpath,
            msk_outpath=msk_outpath,
            fg_outpath=fg_outpath,
            use_tif=use_tif,
        )
        # the handler is the reference for where outputs are actually written
        self.img_outpath, self.msk_outpath, self.fg_outpath = self.handler.get_output()

        # the fold CSV is written next to the image collection
        img_parent = os.path.dirname(img_path)
        self.csv_path = os.path.join(img_parent, 'folds.csv')

        # --- options stored as given ------------------------------------------
        self.num_classes = num_classes
        self.use_one_hot = use_one_hot
        self.remove_bg = remove_bg
        self.use_tif = use_tif
        self.is_2d = is_2d
        self.split_rate_for_single_img = split_rate_for_single_img
        self.median_spacing = np.array(median_spacing)
        self.clipping_bounds = np.array(clipping_bounds)
        self.intensity_moments = intensity_moments

        # --- channel detection from the median size ---------------------------
        # Defaults describe a single-channel dataset with the channel first.
        self.median_size = np.array(median_size)
        self.num_channels = 1
        self.channel_axis = 0

        n_dims = len(self.median_size)
        # One dimension more than the spatial ones (4 in 3D, 3 in 2D) means
        # the median size includes a channel dimension.
        has_channel_dim = n_dims == 4 or (is_2d and n_dims == 3)
        if has_channel_dim:
            # The smallest dimension is assumed to be the channel one; this can
            # be wrong when e.g. there are fewer z-slices than channels.
            self.num_channels = np.min(median_size)
            self.channel_axis = np.argmin(self.median_size)
            if self.channel_axis != 0:
                print("[Warning] 4 dimensions detected and channel axis is {}. All image dimensions will be swapped.".format(self.channel_axis))
                # bring the channel entry to the front by swapping it with entry 0
                self.median_size[[0,self.channel_axis]] = self.median_size[[self.channel_axis,0]]
            # keep only the spatial part
            self.median_size = self.median_size[1:]

        if is_2d:
            # prepend a singleton entry standing for the missing depth axis
            self.median_size = (1, *self.median_size)

        # --- number of folds --------------------------------------------------
        self.img_len = len(self.handler)
        self.num_kfolds = num_kfolds
        if self.img_len < self.num_kfolds * 2:
            self.num_kfolds = max(self.img_len // 2, 2)
            print("[Warning] The number of images {} is smaller than twice the number of folds {}. The number of folds will be reduced to {}.".format(self.img_len, num_kfolds * 2, self.num_kfolds))


    def _split_single(self)->dict[str,Any]:
        """
        Split a single image/mask pair into two parts: training and validation.

        The first image and first mask of the handler are loaded and each is
        cut in two along ONE axis: the first axis of maximal length. The leading
        ``split_rate_for_single_img`` fraction of that axis becomes the
        validation part, the remainder the training part. Every other axis is
        kept whole, even when several axes share the maximal length (cubic
        volumes), so no voxel is lost by the split.

        The four resulting arrays are saved through the handler under names
        produced by ``insert_prefix_to_name`` with prefix ``'0'`` (validation)
        and ``'1'`` (training). ``self.handler`` is then replaced by a new
        handler built on the previous handler's output locations, and a
        two-row CSV (training: fold 1, validation: fold 0, no hold-out) is
        written to ``self.csv_path``.

        Returns
        -------
        metadata : dict
            Metadata returned by the handler when loading the original image.
        """
        rate = self.split_rate_for_single_img

        def split_indices(shape):
            """Return the (validation, training) index tuples for `shape`."""
            # np.argmax returns the first maximal axis, so exactly one axis is cut
            axis = int(np.argmax(shape))
            cut = int(np.floor(rate * shape[axis]))
            n_axes = len(shape)
            val_idx = tuple(
                slice(0, cut) if ax == axis else slice(None) for ax in range(n_axes)
            )
            train_idx = tuple(
                slice(cut, shape[axis]) if ax == axis else slice(None) for ax in range(n_axes)
            )
            return val_idx, train_idx

        # read image and mask
        img_name = self.handler.images[0]
        msk_name = self.handler.masks[0]
        img, metadata = self.handler.load(img_name)
        msk, _ = self.handler.load(msk_name)

        # image and mask may have different shapes (e.g. a channel axis on the
        # image only), so their slicing indices are computed independently
        val_img_idx, train_img_idx = split_indices(img.shape)
        val_msk_idx, train_msk_idx = split_indices(msk.shape)

        # save the crops: validation names start with a 0, training names with a 1
        val_img_path = self.handler.insert_prefix_to_name(img_name,'0')
        self.handler.save(val_img_path,img[val_img_idx],"img")
        val_msk_path = self.handler.insert_prefix_to_name(msk_name,'0')
        self.handler.save(val_msk_path,msk[val_msk_idx],"msk")

        train_img_path = self.handler.insert_prefix_to_name(img_name,'1')
        self.handler.save(train_img_path,img[train_img_idx],"img")
        train_msk_path = self.handler.insert_prefix_to_name(msk_name,'1')
        self.handler.save(train_msk_path,msk[train_msk_idx],"msk")

        # From now on the handler reads from (and writes to) the locations the
        # split files were just saved in.
        images,masks,fg = self.handler.get_output()
        self.handler = DataHandlerFactory.get(
            images,
            preprocess=True,
            output=images,
            msk_path = masks,
            img_outpath = images,
            msk_outpath = masks,
            fg_outpath = fg,
            use_tif=self.use_tif,
        )

        # generate the csv file
        df = pd.DataFrame([train_img_path, val_img_path], columns=['filename'])
        df['hold_out'] = [0,0]
        df['fold'] = [1,0]
        df.to_csv(self.csv_path, index=False)
        return metadata
    

[docs]
    def run(self, debug:bool=False)->None:
        """
        Execute the full preprocessing pipeline.

        When the dataset holds a single image and masks are provided, the
        image/mask pair is first split into a training and a validation part
        (see `_split_single`). Then, for every entry yielded by the handler:

        - the image (and the mask, if `msk_path` is set) is loaded and passed
          to `seg_preprocessor` with the settings stored on the instance;
        - the channel count of 4-dimensional outputs is checked: the first
          processed image defines `self.num_channels`, every following image
          must match it;
        - the preprocessed image is saved, and the mask and foreground are
          saved when both a mask input and a mask output location exist.

        Finally the K-fold CSV is generated, unless the single-image split
        already wrote it.

        Parameters
        ----------
        debug : bool, default=False
            If True, prints filenames during preprocessing instead of using tqdm progress bar.

        Returns
        -------
        None

        Raises
        ------
        AssertionError
            If a 4-dimensional preprocessed image does not have the same
            number of channels as the first one.
        """
        print("Preprocessing...")
        # if there is only a single image/mask, then split them both in two portions
        image_was_split = False
        if self.img_len==1 and self.msk_path is not None:
            print("Single image found per folder. Split the images...")
            split_meta = self._split_single()
            image_was_split = True

        has_masks = self.msk_path is not None

        # the handler must be read after the optional split, which replaces it
        if debug: ran = self.handler
        else: ran = tqdm(self.handler,file=sys.stdout)
        # `i` and `m` are the image/mask identifiers yielded by the handler;
        # `idx` is the position in the iteration (needed for the channel check)
        for idx,(i,m,_) in enumerate(ran):
            # print image name if debug mode
            if debug: 
                print("[{}/{}] Preprocessing:{}".format(self.handler._image_index,len(self.handler),i))

            img,img_meta = self.handler.load(i)
            if has_masks:
                msk, _ = self.handler.load(m)
                img, msk, fg = seg_preprocessor(
                    img                 =img, 
                    # split files reuse the metadata of the original image
                    img_meta            =img_meta if not image_was_split else split_meta,
                    msk                 =msk,
                    num_classes         =self.num_classes,
                    use_one_hot         =self.use_one_hot,
                    remove_bg           =self.remove_bg, 
                    median_spacing      =self.median_spacing,
                    clipping_bounds     =self.clipping_bounds,
                    intensity_moments   =self.intensity_moments,
                    channel_axis        =self.channel_axis,
                    num_channels        =self.num_channels,
                    is_2d               =self.is_2d
                    )
            else:
                img, _ = seg_preprocessor(
                    img                 =img, 
                    img_meta            =img_meta,
                    num_classes         =self.num_classes,
                    median_spacing      =self.median_spacing,
                    clipping_bounds     =self.clipping_bounds,
                    intensity_moments   =self.intensity_moments,
                    channel_axis        =self.channel_axis,
                    num_channels        =self.num_channels,
                    is_2d               =self.is_2d,
                    )

            # sanity check to be sure that all images have the same number of channels
            s = img.shape
            if len(s)==4: # only for images with 4 dimensions
                if idx==0:
                    # the first image sets the reference channel count
                    self.num_channels = s[0]
                else:
                    assert self.num_channels==s[0], "[Error] Not all images have {} channels. Problematic image: {}".format(self.num_channels, i)

            # save image
            # If image was split, it means we already have the original image in the output and we need to overwrite them with their preprocessed version
            self.handler.save(i,img,"img",overwrite=image_was_split)

            # save mask and foreground; both only exist when masks were loaded
            if has_masks and self.msk_outpath is not None: 
                self.handler.save(m,msk,"msk",overwrite=image_was_split)
                self.handler.save(m,fg,"fg")

        # create csv file (already written by `_split_single` when the image was split)
        filenames = self.handler.extract_inner_path(self.handler.images)
        if not image_was_split:
            generate_kfold_csv(filenames, self.csv_path, kfold=self.num_kfolds)

        print("Done preprocessing!")



#---------------------------------------------------------------------------


[docs]
def auto_config_preprocess(
        img_path:str, 
        msk_path:str, 
        num_classes:int, 
        config_dir:str, 
        base_config:str, 
        img_outpath:Optional[str]=None,
        msk_outpath:Optional[str]=None,
        use_one_hot:bool=False,
        ct_norm:bool=False,
        remove_bg:bool=False, 
        use_tif:bool=False,
        desc:str="unet", 
        max_dim:int=128,
        num_epochs:int=1000,
        num_workers:int=6,
        skip_preprocessing:bool=False,
        no_auto_config:bool=False,
        logs_dir:str='logs/',
        print_param:bool=False,
        debug:bool=False,
        is_2d:bool=False,
        ):
    """
    Fingerprint a dataset, preprocess it and write a training configuration.

    The function chains three stages:

    1. `data_fingerprint` computes the median size, median spacing and
       intensity statistics (restricted to the masks when `ct_norm` is set).
    2. A `Preprocessing` object is built from these values and, unless
       `skip_preprocessing` is set, run on the dataset.
    3. Unless `no_auto_config` is set, `auto_config` derives the batch size,
       patch sizes and number of poolings, and `save_python_config` stores
       them together with the other hyper-parameters.

    Parameters
    ----------
    img_path : str
        Path to the collection containing raw input images.
    msk_path : str
        Path to the collection containing corresponding segmentation masks.
    num_classes : int
        Number of segmentation classes (excluding background). The value
        passed to `Preprocessing` is `num_classes + 1`.
    config_dir : str
        Directory where the auto-generated configuration file will be saved.
    base_config : str
        Path to the base configuration template (Python file).
    img_outpath : str, optional
        Output path for preprocessed images.
    msk_outpath : str, optional
        Output path for preprocessed masks.
    use_one_hot : bool, default=False
        Whether to convert the segmentation masks to one-hot encoded format.
    ct_norm : bool, default=False
        If True, the masks are given to the fingerprint computation and the
        resulting percentiles / moments are used as clipping bounds and
        normalization statistics; otherwise both are left empty.
    remove_bg : bool, default=False
        Whether to exclude the background class during training (useful with sigmoid output).
    use_tif : bool, default=False
        If True, save the processed files in `.tif` format instead of `.npy`.
    desc : str, default="unet"
        Descriptor string saved in the config to identify the model/config.
    max_dim : int, default=128
        Upper bound, applied to each of the three axes, on the patch size
        searched by the auto-configuration.
    num_epochs : int, default=1000
        Number of training epochs to set in the config file.
    num_workers : int, default=6
        Number of workers used for data loading during training.
    skip_preprocessing : bool, default=False
        If True, skip the preprocessing step and only generate the config.
    no_auto_config : bool, default=False
        If True, skip the config generation and only run preprocessing.
    logs_dir : str, default='logs/'
        Directory path to store logs (saved in the config).
    print_param : bool, default=False
        If True, suppress the human-readable messages and print only the
        bare auto-config values (batch, patch, augmentation patch, pools,
        config path), one per line.
    debug : bool, default=False
        If True, run preprocessing with verbose logging and no progress bar.
    is_2d : bool, default=False
        Whether the dataset is 2D instead of 3D.

    Returns
    -------
    config_path or None
        Value returned by `save_python_config`, or None when
        `no_auto_config` is True.
    """
    # human-readable messages are only shown when the raw parameter dump is off
    verbose = not print_param

    # ---- 1. dataset fingerprint ----
    fingerprint_msk_path = msk_path if ct_norm else None
    median_size, median_spacing, mean, std, perc_005, perc_995 = data_fingerprint(img_path, fingerprint_msk_path)
    if verbose:
        print("Data fingerprint:")
        report = (
            ("Median size:", median_size),
            ("Median spacing:", median_spacing),
            ("Mean intensity:", mean),
            ("Standard deviation of intensities:", std),
            ("0.5% percentile of intensities:", perc_005),
            ("99.5% percentile of intensities:", perc_995),
        )
        for label, value in report:
            print(label, value)
        print("")

    if ct_norm:
        if verbose: print("Computing data fingerprint for CT normalization...")
        clipping_bounds = [perc_005, perc_995]
        intensity_moments = [mean, std]
        if verbose: print("Done!")
    else:
        clipping_bounds, intensity_moments = [], []

    # ---- 2. preprocessing ----
    p = Preprocessing(
        img_path=img_path,
        msk_path=msk_path,
        img_outpath=img_outpath,
        msk_outpath=msk_outpath,
        num_classes=num_classes+1,  # background is counted here
        use_one_hot=use_one_hot,
        remove_bg=remove_bg,
        use_tif=use_tif,
        median_spacing=median_spacing,
        median_size=median_size,
        clipping_bounds=clipping_bounds,
        intensity_moments=intensity_moments,
        is_2d=is_2d,
    )

    if not skip_preprocessing:
        p.run(debug=debug)

    # ---- 3. auto-configuration ----
    if no_auto_config:
        return None

    if verbose: print("Start auto-configuration")
    handler = DataHandlerFactory.get(
        img_path,
        read_only=True,
        output=None,
    )

    median_for_config = (1, *p.median_size) if is_2d else p.median_size
    fallback_img_path = img_path if p.median_size is None else None
    batch, aug_patch, patch, pool = auto_config(
        median=median_for_config,
        img_path=fallback_img_path,
        max_dims=(max_dim,) * 3,
        max_batch=len(handler)//20, # we limit batch to avoid overfitting
    )

    # convert path for windows systems before writing them
    if platform=='win32' and p.csv_path is not None:
        p.csv_path = p.csv_path.replace('\\','\\\\')

    # hyper-parameters stored in the config file (insertion order is kept)
    hyper_params = dict(
        IMG_PATH=p.img_outpath,
        MSK_PATH=p.msk_outpath,
        FG_PATH=p.fg_outpath,
        CSV_DIR=p.csv_path,
        NUM_CLASSES=num_classes,
        NUM_CHANNELS=p.num_channels,
        CHANNEL_AXIS=p.channel_axis,
        BATCH_SIZE=batch,
        AUG_PATCH_SIZE=aug_patch,
        PATCH_SIZE=patch,
        NUM_POOLS=pool,
        MEDIAN_SPACING=median_spacing,
        CLIPPING_BOUNDS=clipping_bounds,
        INTENSITY_MOMENTS=intensity_moments,
        DESC=desc,
        NB_EPOCHS=num_epochs,
        NUM_WORKERS=num_workers,
        LOG_DIR=logs_dir,
        IS_2D=is_2d,
    )
    config_path = save_python_config(
        config_dir=config_dir,
        base_config=base_config,
        **hyper_params,
    )

    if print_param:
        for value in (batch, patch, aug_patch, pool, config_path):
            print(value)
    else:
        print("Auto-config done! Configuration saved in: ", config_path)

    return config_path


if __name__=='__main__':
    # Command-line entry point: parse the options and forward them unchanged
    # to `auto_config_preprocess`.

    def _str_to_bool(value):
        """Convert a command-line token such as 'True'/'false'/'1'/'no' to a bool.

        Needed because argparse stores option values as strings, and any
        non-empty string (including 'False') is truthy.
        """
        normalized = str(value).strip().lower()
        if normalized in ("1", "true", "t", "yes", "y"):
            return True
        if normalized in ("0", "false", "f", "no", "n"):
            return False
        raise argparse.ArgumentTypeError("Boolean value expected, got '{}'.".format(value))

    parser = argparse.ArgumentParser(description="Dataset preprocessing for training purpose.")
    parser.add_argument("--img_path","--img_dir",dest="img_path", type=str,required=True,
        help="Path of the images collection")
    parser.add_argument("--msk_path","--msk_dir",dest="msk_path", type=str, default=None,
        help="(default=None) Path to the masks/labels collection")
    parser.add_argument("--img_outpath","--img_outdir",dest="img_outpath", type=str, default=None,
        help="(default=None : Current directory) Path to the ouput of the preprocessed images")
    parser.add_argument("--msk_outpath","--msk_outdir",dest="msk_outpath", type=str, default=None,
        help="(default=None : Current directory) Path to the output of the preprocessed masks/labels")
    parser.add_argument("--num_classes", type=int, default=1,
        help="(default=1) Number of classes (types of objects) in the dataset. The background is not included.")
    parser.add_argument("--max_dim", type=int, default=128,
        help="(default=128) max_dim^3 determines the maximum size of patch for auto-config.")
    parser.add_argument("--num_epochs", type=int, default=1000,
        help="(default=1000) Number of epochs for the training.")
    parser.add_argument("--num_workers", type=int, default=6,
        help="(default=6) Number of workers for the training. Half of it will be used for validation.")
    parser.add_argument("--config_dir", type=str, default='configs/',
        help="(default=\'configs/\') Configuration folder to save the auto-configuration.")
    parser.add_argument("--logs_dir", type=str, default='logs/',
        help="(default=\'logs/\') Builder output folder to save the model.")
    parser.add_argument("--base_config", type=str, default=None,
        help="(default=None) Optional. Path to an existing configuration file which will be updated with the preprocessed values.")
    parser.add_argument("--desc", type=str, default='unet_default',
        help="(default=unet_default) Optional. A name used to describe the model.")
    parser.add_argument("--use_tif", default=False,  action='store_true', dest='use_tif',
        help="(default=False) Whether to use tif format to save the preprocessed images instead of npy format. Tif files are easily readable with viewers such as Napari and takes fewer disk space but are slower to load and may slow down the training process.") 
    parser.add_argument("--use_one_hot", default=False,  action='store_true', dest='use_one_hot',
        help="(default=False) Whether to use one hot encoding of the mask. Can slow down the training.") 
    parser.add_argument("--remove_bg", default=False,  action='store_true', dest='remove_bg',
        help="(default=False) If use one hot, remove the background in masks. Remove the bg to use with sigmoid activation maps (not softmax).") 
    parser.add_argument("--no_auto_config", default=False,  action='store_true', dest='no_auto_config',
        help="(default=False) For debugging, deactivate auto-configuration.") 
    parser.add_argument("--ct_norm", default=False,  action='store_true', dest='ct_norm',
        help="(default=False) Whether to use CT-Scan normalization routine (cf. nnUNet).") 
    parser.add_argument("--skip_preprocessing", default=False,  action='store_true', dest='skip_preprocessing',
        help="(default=False) Whether to skip the preprocessing. Only for debugging.") 
    parser.add_argument("--remote", default=False,  action='store_true', dest='remote',
        help="(default=False) Whether to print auto-config parameters. Used for remote preprocessing using the GUI.") 
    parser.add_argument("--debug", default=False,  action='store_true', dest='debug',
        help="(default=False) Debug mode. Whether to print all image filenames while preprocessing.") 
    # `--is_2d` historically took a value (e.g. `--is_2d True`); the value is
    # now parsed as a real boolean so that `--is_2d False` is False, and the
    # bare flag `--is_2d` (no value) means True.
    parser.add_argument("--is_2d", default=False,dest='is_2d', type=_str_to_bool, nargs='?', const=True,
        help="(default=False) Whether the image is 2d.")
    args = parser.parse_args()

    auto_config_preprocess(
        img_path=args.img_path, 
        msk_path=args.msk_path, 
        num_classes=args.num_classes, 
        config_dir=args.config_dir, 
        base_config=args.base_config, 
        img_outpath=args.img_outpath,
        msk_outpath=args.msk_outpath,
        use_one_hot=args.use_one_hot,
        ct_norm=args.ct_norm,
        remove_bg=args.remove_bg, 
        use_tif=args.use_tif,
        desc=args.desc, 
        max_dim=args.max_dim,
        num_epochs=args.num_epochs,
        num_workers=args.num_workers,
        skip_preprocessing=args.skip_preprocessing,
        no_auto_config=args.no_auto_config,
        logs_dir=args.logs_dir,
        print_param=args.remote,
        debug=args.debug,
        is_2d=args.is_2d,
        )

#---------------------------------------------------------------------------