
Slicing

sahi.slicing

Classes

SliceImageResult

Source code in sahi/slicing.py
class SliceImageResult:
    def __init__(self, original_image_size: List[int], image_dir: Optional[str] = None):
        """
        image_dir: str
            Directory of the sliced image exports.
        original_image_size: list of int
            Size of the unsliced original image in [height, width]
        """
        self.original_image_height = original_image_size[0]
        self.original_image_width = original_image_size[1]
        self.image_dir = image_dir

        self._sliced_image_list: List[SlicedImage] = []

    def add_sliced_image(self, sliced_image: SlicedImage):
        if not isinstance(sliced_image, SlicedImage):
            raise TypeError("sliced_image must be a SlicedImage instance")

        self._sliced_image_list.append(sliced_image)

    @property
    def sliced_image_list(self):
        return self._sliced_image_list

    @property
    def images(self):
        """Returns sliced images.

        Returns:
            images: a list of np.array
        """
        images = []
        for sliced_image in self._sliced_image_list:
            images.append(sliced_image.image)
        return images

    @property
    def coco_images(self) -> List[CocoImage]:
        """Returns CocoImage representation of SliceImageResult.

        Returns:
            coco_images: a list of CocoImage
        """
        coco_images: List = []
        for sliced_image in self._sliced_image_list:
            coco_images.append(sliced_image.coco_image)
        return coco_images

    @property
    def starting_pixels(self) -> List[List[int]]:
        """Returns a list of starting pixels for each slice.

        Returns:
            starting_pixels: a list of starting pixel coords [x,y]
        """
        starting_pixels = []
        for sliced_image in self._sliced_image_list:
            starting_pixels.append(sliced_image.starting_pixel)
        return starting_pixels

    @property
    def filenames(self) -> List[str]:
        """Returns a list of filenames for each slice.

        Returns:
            filenames: a list of filenames as str
        """
        filenames = []
        for sliced_image in self._sliced_image_list:
            filenames.append(sliced_image.coco_image.file_name)
        return filenames

    def __getitem__(self, i):
        def _prepare_ith_dict(i):
            return {
                "image": self.images[i],
                "coco_image": self.coco_images[i],
                "starting_pixel": self.starting_pixels[i],
                "filename": self.filenames[i],
            }

        if isinstance(i, np.ndarray):
            i = i.tolist()

        if isinstance(i, int):
            return _prepare_ith_dict(i)
        elif isinstance(i, slice):
            start, stop, step = i.indices(len(self))
            return [_prepare_ith_dict(i) for i in range(start, stop, step)]
        elif isinstance(i, (tuple, list)):
            accessed_mapping = map(_prepare_ith_dict, i)
            return list(accessed_mapping)
        else:
            raise NotImplementedError(f"{type(i)}")

    def __len__(self):
        return len(self._sliced_image_list)
Attributes
coco_images property

Returns CocoImage representation of SliceImageResult.

Returns:
    coco_images (List[CocoImage]): a list of CocoImage

filenames property

Returns a list of filenames for each slice.

Returns:
    filenames (List[str]): a list of filenames as str

images property

Returns sliced images.

Returns:
    images: a list of np.array

starting_pixels property

Returns a list of starting pixels for each slice.

Returns:
    starting_pixels (List[List[int]]): a list of starting pixel coords [x, y]

Functions
__init__(original_image_size, image_dir=None)

Parameters:
    original_image_size (list of int): Size of the unsliced original image in [height, width]. (required)
    image_dir (str, optional): Directory of the sliced image exports. Default None.

Source code in sahi/slicing.py
def __init__(self, original_image_size: List[int], image_dir: Optional[str] = None):
    """
    image_dir: str
        Directory of the sliced image exports.
    original_image_size: list of int
        Size of the unsliced original image in [height, width]
    """
    self.original_image_height = original_image_size[0]
    self.original_image_width = original_image_size[1]
    self.image_dir = image_dir

    self._sliced_image_list: List[SlicedImage] = []

SlicedImage

Source code in sahi/slicing.py
class SlicedImage:
    def __init__(self, image, coco_image, starting_pixel):
        """
        image: np.array
            Sliced image.
        coco_image: CocoImage
            Coco styled image object that belongs to the sliced image.
        starting_pixel: list of int
            Starting pixel [x, y] coordinates of the sliced image.
        """
        self.image = image
        self.coco_image = coco_image
        self.starting_pixel = starting_pixel
Functions
__init__(image, coco_image, starting_pixel)

Parameters:
    image (np.array): Sliced image.
    coco_image (CocoImage): Coco styled image object that belongs to the sliced image.
    starting_pixel (list of int): Starting pixel [x, y] coordinates of the sliced image.

Source code in sahi/slicing.py
def __init__(self, image, coco_image, starting_pixel):
    """
    image: np.array
        Sliced image.
    coco_image: CocoImage
        Coco styled image object that belongs to the sliced image.
    starting_pixel: list of int
        Starting pixel [x, y] coordinates of the sliced image.
    """
    self.image = image
    self.coco_image = coco_image
    self.starting_pixel = starting_pixel
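
Example: the indexing behavior implemented in __getitem__ above can be exercised with a couple of hand-built slices. A minimal sketch (the arrays and file names below are hypothetical placeholder data, assuming the CocoImage constructor from sahi.utils.coco):

import numpy as np

from sahi.slicing import SlicedImage, SliceImageResult
from sahi.utils.coco import CocoImage

# a 20x10 original image represented by two dummy 10x10 slices
result = SliceImageResult(original_image_size=[20, 10])
for idx, start_y in enumerate([0, 10]):
    result.add_sliced_image(
        SlicedImage(
            image=np.zeros((10, 10, 3), dtype=np.uint8),
            coco_image=CocoImage(file_name=f"slice_{idx}.png", height=10, width=10),
            starting_pixel=[0, start_y],
        )
    )

print(len(result))                  # 2
print(result[0]["starting_pixel"])  # [0, 0]
print(result[0:2][1]["filename"])   # slice_1.png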

Functions

annotation_inside_slice(annotation, slice_bbox)

Check whether annotation coordinates lie inside slice coordinates.

Parameters:
    annotation (dict): Single annotation entry in COCO format. (required)
    slice_bbox (List[int]): Generated from get_slice_bboxes. Format for each slice bbox: [x_min, y_min, x_max, y_max]. (required)

Returns:
    bool: True if any annotation coordinate lies inside slice.

Source code in sahi/slicing.py
def annotation_inside_slice(annotation: Dict, slice_bbox: List[int]) -> bool:
    """Check whether annotation coordinates lie inside slice coordinates.

    Args:
        annotation (dict): Single annotation entry in COCO format.
        slice_bbox (List[int]): Generated from `get_slice_bboxes`.
            Format for each slice bbox: [x_min, y_min, x_max, y_max].

    Returns:
        (bool): True if any annotation coordinate lies inside slice.
    """
    left, top, width, height = annotation["bbox"]

    right = left + width
    bottom = top + height

    if left >= slice_bbox[2]:
        return False
    if top >= slice_bbox[3]:
        return False
    if right <= slice_bbox[0]:
        return False
    if bottom <= slice_bbox[1]:
        return False

    return True
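
For illustration (hypothetical values), a COCO bbox is [x_min, y_min, width, height], and the check passes whenever the annotation and the slice overlap at all:

from sahi.slicing import annotation_inside_slice

ann = {"bbox": [50, 50, 30, 30]}  # xywh, i.e. spans x 50-80, y 50-80

annotation_inside_slice(ann, slice_bbox=[0, 0, 60, 60])        # True: partial overlap counts
annotation_inside_slice(ann, slice_bbox=[100, 100, 200, 200])  # False: fully outside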

calc_aspect_ratio_orientation(width, height)

Parameters:
    width (int): image width in pixels. (required)
    height (int): image height in pixels. (required)

Returns:
    str: image orientation, one of "vertical", "horizontal", or "square"

Source code in sahi/slicing.py
def calc_aspect_ratio_orientation(width: int, height: int) -> str:
    """

    Args:
        width: image width in pixels
        height: image height in pixels

    Returns:
        image orientation, one of "vertical", "horizontal", or "square"
    """

    if width < height:
        return "vertical"
    elif width > height:
        return "horizontal"
    else:
        return "square"

calc_ratio_and_slice(orientation, slide=1, ratio=0.1)

Calculate slice counts and overlap ratios according to image orientation.

Parameters:
    orientation: image orientation ("vertical", "horizontal", or "square")
    slide: sliding window multiplier
    ratio: overlap (buffer) ratio

Returns:
    overlap params (slice_row, slice_col, overlap_height_ratio, overlap_width_ratio)

Source code in sahi/slicing.py
def calc_ratio_and_slice(orientation: Literal["vertical", "horizontal", "square"], slide: int = 1, ratio: float = 0.1):
    """
    Calculate slice counts and overlap ratios according to image orientation.
    Args:
        orientation: image orientation ("vertical", "horizontal", or "square")
        slide: sliding window multiplier
        ratio: overlap (buffer) ratio

    Returns:
        overlap params
    """
    if orientation == "vertical":
        slice_row, slice_col, overlap_height_ratio, overlap_width_ratio = slide, slide * 2, ratio, ratio
    elif orientation == "horizontal":
        slice_row, slice_col, overlap_height_ratio, overlap_width_ratio = slide * 2, slide, ratio, ratio
    elif orientation == "square":
        slice_row, slice_col, overlap_height_ratio, overlap_width_ratio = slide, slide, ratio, ratio
    else:
        raise ValueError(f"Invalid orientation: {orientation}. Must be one of 'vertical', 'horizontal', or 'square'.")

    return slice_row, slice_col, overlap_height_ratio, overlap_width_ratio  # noqa
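
For example, a vertical image doubles the column count relative to the row count, while a horizontal image doubles the row count:

from sahi.slicing import calc_ratio_and_slice

calc_ratio_and_slice("vertical", slide=2, ratio=0.4)    # (2, 4, 0.4, 0.4)
calc_ratio_and_slice("horizontal", slide=2, ratio=0.4)  # (4, 2, 0.4, 0.4)
calc_ratio_and_slice("square", slide=1, ratio=0.1)      # (1, 1, 0.1, 0.1)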

calc_resolution_factor(resolution)

Return the largest n such that 2**n is smaller than the image resolution.

Parameters:
    resolution: the image width multiplied by its height, e.g. 1024x720 = 737280

Returns:
    int: the exponent n

Source code in sahi/slicing.py
def calc_resolution_factor(resolution: int) -> int:
    """
    Return the largest `n` such that 2**n is smaller than the image resolution.
    Args:
        resolution: the image width multiplied by its height, e.g. 1024x720 = 737280

    Returns:
        int: the exponent `n`
    """
    expo = 0
    while np.power(2, expo) < resolution:
        expo += 1

    return expo - 1
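
Using the example from the docstring: 2**19 = 524288 < 737280 <= 2**20, so the largest smaller exponent is 19:

from sahi.slicing import calc_resolution_factor

calc_resolution_factor(1024 * 720)  # 19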

calc_slice_and_overlap_params(resolution, height, width, orientation)

Calculate slice and overlap parameters according to the image resolution class.

Parameters:
    resolution (str): resolution class ("low", "medium", "high", or "ultra-high")
    height (int): image height
    width (int): image width
    orientation (str): image orientation

Returns:
    Tuple[int, int, int, int]: x_overlap, y_overlap, slice_width, slice_height

Source code in sahi/slicing.py
def calc_slice_and_overlap_params(
    resolution: str, height: int, width: int, orientation: str
) -> Tuple[int, int, int, int]:
    """
    Calculate slice and overlap parameters according to the image resolution class.
    Args:
        resolution: str
        height: int
        width: int
        orientation: str

    Returns:
        x_overlap, y_overlap, slice_width, slice_height
    """

    if resolution == "medium":
        split_row, split_col, overlap_height_ratio, overlap_width_ratio = calc_ratio_and_slice(
            orientation, slide=1, ratio=0.8
        )

    elif resolution == "high":
        split_row, split_col, overlap_height_ratio, overlap_width_ratio = calc_ratio_and_slice(
            orientation, slide=2, ratio=0.4
        )

    elif resolution == "ultra-high":
        split_row, split_col, overlap_height_ratio, overlap_width_ratio = calc_ratio_and_slice(
            orientation, slide=4, ratio=0.4
        )
    else:  # low condition
        split_col = 1
        split_row = 1
        overlap_width_ratio = 1
        overlap_height_ratio = 1

    slice_height = height // split_col
    slice_width = width // split_row

    x_overlap = int(slice_width * overlap_width_ratio)
    y_overlap = int(slice_height * overlap_height_ratio)

    return x_overlap, y_overlap, slice_width, slice_height
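
Tracing a "medium" 1920x1080 (horizontal) image through the function: slide=1 and ratio=0.8 give split_row=2 and split_col=1, so slice_width = 1920 // 2 = 960, slice_height = 1080 // 1 = 1080, x_overlap = int(960 * 0.8) = 768 and y_overlap = int(1080 * 0.8) = 864:

from sahi.slicing import calc_slice_and_overlap_params

calc_slice_and_overlap_params(
    resolution="medium", height=1080, width=1920, orientation="horizontal"
)
# (768, 864, 960, 1080)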

get_auto_slice_params(height, width)

Calculate sliding-window and overlap parameters from the image height and width. factor is the power of 2 closest to the image resolution:
    factor <= 18: low resolution image, e.g. 300x300, 640x640
    18 < factor <= 21: medium resolution image, e.g. 1024x1024, 1336x960
    21 < factor <= 24: high resolution image, e.g. 2048x2048, 2048x4096, 4096x4096
    factor > 24: ultra-high resolution image, e.g. 6380x6380, 4096x8192

Parameters:
    height (int): image height
    width (int): image width

Returns:
    Tuple[int, int, int, int]: slicing overlap params x_overlap, y_overlap, slice_width, slice_height

Source code in sahi/slicing.py
def get_auto_slice_params(height: int, width: int) -> Tuple[int, int, int, int]:
    """
    Calculate sliding-window and overlap parameters from the image height and width.
    factor is the power value of 2 closest to the image resolution.
        factor <= 18: low resolution image such as 300x300, 640x640
        18 < factor <= 21: medium resolution image such as 1024x1024, 1336x960
        21 < factor <= 24: high resolution image such as 2048x2048, 2048x4096, 4096x4096
        factor > 24: ultra-high resolution image such as 6380x6380, 4096x8192
    Args:
        height:
        width:

    Returns:
        slicing overlap params x_overlap, y_overlap, slice_width, slice_height
    """
    resolution = height * width
    factor = calc_resolution_factor(resolution)
    if factor <= 18:
        return get_resolution_selector("low", height=height, width=width)
    elif 18 <= factor < 21:
        return get_resolution_selector("medium", height=height, width=width)
    elif 21 <= factor < 24:
        return get_resolution_selector("high", height=height, width=width)
    else:
        return get_resolution_selector("ultra-high", height=height, width=width)

get_resolution_selector(res, height, width)

Parameters:
    res (str): resolution class of the image, such as "low", "medium" (required)
    height (int): image height (required)
    width (int): image width (required)

Returns:
    Tuple[int, int, int, int]: x_overlap, y_overlap, slice_width, slice_height

Source code in sahi/slicing.py
def get_resolution_selector(res: str, height: int, width: int) -> Tuple[int, int, int, int]:
    """

    Args:
        res: resolution class of the image, such as "low", "medium"
        height: image height
        width: image width

    Returns:
        x_overlap, y_overlap, slice_width, slice_height
    """
    orientation = calc_aspect_ratio_orientation(width=width, height=height)
    x_overlap, y_overlap, slice_width, slice_height = calc_slice_and_overlap_params(
        resolution=res, height=height, width=width, orientation=orientation
    )

    return x_overlap, y_overlap, slice_width, slice_height

get_slice_bboxes(image_height, image_width, slice_height=None, slice_width=None, auto_slice_resolution=True, overlap_height_ratio=0.2, overlap_width_ratio=0.2)

Generate bounding boxes for slicing an image into crops.

The function calculates the coordinates for each slice based on the provided image dimensions, slice size, and overlap ratios. If slice size is not provided and auto_slice_resolution is True, the function will automatically determine appropriate slice parameters.

Parameters:
    image_height (int): Height of the original image. (required)
    image_width (int): Width of the original image. (required)
    slice_height (int, optional): Height of each slice. Default None.
    slice_width (int, optional): Width of each slice. Default None.
    overlap_height_ratio (float, optional): Fractional overlap in height of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels). Default 0.2.
    overlap_width_ratio (float, optional): Fractional overlap in width of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels). Default 0.2.
    auto_slice_resolution (bool, optional): If slice parameters (slice_height, slice_width) are not provided, automatically calculate them from the image resolution and orientation. Default True.

Returns:
    List[List[int]]: List of 4 corner coordinates for each of the N slices:
        [
            [slice_0_left, slice_0_top, slice_0_right, slice_0_bottom],
            ...
            [slice_N_left, slice_N_top, slice_N_right, slice_N_bottom]
        ]

Source code in sahi/slicing.py
def get_slice_bboxes(
    image_height: int,
    image_width: int,
    slice_height: Optional[int] = None,
    slice_width: Optional[int] = None,
    auto_slice_resolution: Optional[bool] = True,
    overlap_height_ratio: Optional[float] = 0.2,
    overlap_width_ratio: Optional[float] = 0.2,
) -> List[List[int]]:
    """Generate bounding boxes for slicing an image into crops.

    The function calculates the coordinates for each slice based on the provided
    image dimensions, slice size, and overlap ratios. If slice size is not provided
    and auto_slice_resolution is True, the function will automatically determine
    appropriate slice parameters.

    Args:
        image_height (int): Height of the original image.
        image_width (int): Width of the original image.
        slice_height (int, optional): Height of each slice. Default None.
        slice_width (int, optional): Width of each slice. Default None.
        overlap_height_ratio (float, optional): Fractional overlap in height of each
            slice (e.g. an overlap of 0.2 for a slice of size 100 yields an
            overlap of 20 pixels). Default 0.2.
        overlap_width_ratio (float, optional): Fractional overlap in width of each
            slice (e.g. an overlap of 0.2 for a slice of size 100 yields an
            overlap of 20 pixels). Default 0.2.
        auto_slice_resolution (bool, optional): If slice parameters (slice_height, slice_width)
            are not provided, automatically calculate them from the image resolution and orientation.

    Returns:
        List[List[int]]: List of 4 corner coordinates for each of the N slices.
            [
                [slice_0_left, slice_0_top, slice_0_right, slice_0_bottom],
                ...
                [slice_N_left, slice_N_top, slice_N_right, slice_N_bottom]
            ]
    """
    slice_bboxes = []
    y_max = y_min = 0

    if slice_height and slice_width:
        y_overlap = int(overlap_height_ratio * slice_height)
        x_overlap = int(overlap_width_ratio * slice_width)
    elif auto_slice_resolution:
        x_overlap, y_overlap, slice_width, slice_height = get_auto_slice_params(height=image_height, width=image_width)
    else:
        raise ValueError("Compute type is not auto and slice width and height are not provided.")

    while y_max < image_height:
        x_min = x_max = 0
        y_max = y_min + slice_height
        while x_max < image_width:
            x_max = x_min + slice_width
            if y_max > image_height or x_max > image_width:
                xmax = min(image_width, x_max)
                ymax = min(image_height, y_max)
                xmin = max(0, xmax - slice_width)
                ymin = max(0, ymax - slice_height)
                slice_bboxes.append([xmin, ymin, xmax, ymax])
            else:
                slice_bboxes.append([x_min, y_min, x_max, y_max])
            x_min = x_max - x_overlap
        y_min = y_max - y_overlap
    return slice_bboxes
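
For example, slicing a 500x500 image into 256x256 windows with 0.2 overlap yields a 3x3 grid of boxes, with the last row and column shifted inward so every slice stays inside the image:

from sahi.slicing import get_slice_bboxes

boxes = get_slice_bboxes(
    image_height=500,
    image_width=500,
    slice_height=256,
    slice_width=256,
    overlap_height_ratio=0.2,
    overlap_width_ratio=0.2,
)
len(boxes)  # 9
boxes[0]    # [0, 0, 256, 256]
boxes[-1]   # [244, 244, 500, 500]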

process_coco_annotations(coco_annotation_list, slice_bbox, min_area_ratio)

Slices and filters the given list of CocoAnnotation objects using the given slice_bbox and min_area_ratio.

Parameters:
    coco_annotation_list (List[CocoAnnotation]): List of CocoAnnotation objects. (required)
    slice_bbox (List[int]): Generated from get_slice_bboxes. Format for each slice bbox: [x_min, y_min, x_max, y_max]. (required)
    min_area_ratio (float): If the cropped annotation area to original annotation area ratio is smaller than this value, the annotation is filtered out. (required)

Returns:
    List[CocoAnnotation]: Sliced annotations.

Source code in sahi/slicing.py
def process_coco_annotations(
    coco_annotation_list: List[CocoAnnotation], slice_bbox: List[int], min_area_ratio
) -> List[CocoAnnotation]:
    """Slices and filters given list of CocoAnnotation objects with given
    'slice_bbox' and 'min_area_ratio'.

    Args:
        coco_annotation_list (List[CocoAnnotation])
        slice_bbox (List[int]): Generated from `get_slice_bboxes`.
            Format for each slice bbox: [x_min, y_min, x_max, y_max].
        min_area_ratio (float): If the cropped annotation area to original
            annotation ratio is smaller than this value, the annotation is
            filtered out. Default 0.1.

    Returns:
        (List[CocoAnnotation]): Sliced annotations.
    """

    sliced_coco_annotation_list: List[CocoAnnotation] = []
    for coco_annotation in coco_annotation_list:
        if annotation_inside_slice(coco_annotation.json, slice_bbox):
            sliced_coco_annotation = coco_annotation.get_sliced_coco_annotation(slice_bbox)
            if sliced_coco_annotation.area / coco_annotation.area >= min_area_ratio:
                sliced_coco_annotation_list.append(sliced_coco_annotation)
    return sliced_coco_annotation_list
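
A minimal sketch of the min_area_ratio filter (hypothetical annotation values, assuming CocoAnnotation's xywh bbox constructor from sahi.utils.coco): the box below overlaps the slice, but only a 16x16 corner survives clipping, and 256 / 10000 = 0.0256 < 0.1, so it is filtered out:

from sahi.slicing import process_coco_annotations
from sahi.utils.coco import CocoAnnotation

ann = CocoAnnotation(bbox=[240, 240, 100, 100], category_id=1, category_name="car")

process_coco_annotations([ann], slice_bbox=[0, 0, 256, 256], min_area_ratio=0.1)
# [] -> clipped area ratio 0.0256 is below 0.1, annotation dropped
process_coco_annotations([ann], slice_bbox=[0, 0, 256, 256], min_area_ratio=0.01)
# [CocoAnnotation clipped to the 16x16 overlap region]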

shift_bboxes(bboxes, offset)

Shift bboxes w.r.t. offset.

Parameters:
    bboxes (Tensor, np.ndarray, or list): The bboxes to be shifted; shape can be (n, 4), in (x_min, y_min, x_max, y_max) format. (required)
    offset (Sequence[int]): The translation offsets, with shape (2,). (required)

Returns:
    Tensor, np.ndarray, or list: Shifted bboxes.

Source code in sahi/slicing.py
def shift_bboxes(bboxes, offset: Sequence[int]):
    """
    Shift bboxes w.r.t. offset.

    Args:
        bboxes (Tensor, np.ndarray, list): The bboxes to be shifted. Shape can
            be (n, 4), in (x_min, y_min, x_max, y_max) format.
        offset (Sequence[int]): The translation offsets with shape of (2, ).
    Returns:
        Tensor, np.ndarray, list: Shifted bboxes.
    """
    shifted_bboxes = []

    if type(bboxes).__module__ == "torch":
        bboxes_is_torch_tensor = True
    else:
        bboxes_is_torch_tensor = False

    for bbox in bboxes:
        if bboxes_is_torch_tensor or isinstance(bbox, np.ndarray):
            bbox = bbox.tolist()
        bbox = BoundingBox(bbox, shift_amount=offset)
        bbox = bbox.get_shifted_box()
        shifted_bboxes.append(bbox.to_xyxy())

    if isinstance(bboxes, np.ndarray):
        return np.stack(shifted_bboxes, axis=0)
    elif bboxes_is_torch_tensor:
        return bboxes.new_tensor(shifted_bboxes)
    else:
        return shifted_bboxes
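
For example, with plain-list input an offset of (x, y) = (100, 200) translates each box accordingly:

from sahi.slicing import shift_bboxes

shift_bboxes([[10, 10, 50, 50]], offset=[100, 200])
# [[110, 210, 150, 250]]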

shift_masks(masks, offset, full_shape)

Shift masks to the original image.

Parameters:
    masks (np.ndarray): Masks to be shifted. (required)
    offset (Sequence[int]): The offset to translate with, shape (2,). (required)
    full_shape (Sequence[int]): A (height, width) tuple of the full image's shape. (required)

Returns:
    np.ndarray: Shifted masks.

Source code in sahi/slicing.py
def shift_masks(masks: np.ndarray, offset: Sequence[int], full_shape: Sequence[int]) -> np.ndarray:
    """Shift masks to the original image.
    Args:
        masks (np.ndarray): masks that need to be shifted.
        offset (Sequence[int]): The offset to translate with shape of (2, ).
        full_shape (Sequence[int]): A (height, width) tuple of the full image's shape.
    Returns:
        np.ndarray: Shifted masks.
    """
    # empty masks
    if masks is None:
        return masks

    shifted_masks = []
    for mask in masks:
        mask = Mask(segmentation=mask, shift_amount=offset, full_shape=full_shape)
        mask = mask.get_shifted_mask()
        shifted_masks.append(mask.bool_mask)

    return np.stack(shifted_masks, axis=0)

slice_coco(coco_annotation_file_path, image_dir, output_coco_annotation_file_name, output_dir=None, ignore_negative_samples=False, slice_height=512, slice_width=512, overlap_height_ratio=0.2, overlap_width_ratio=0.2, min_area_ratio=0.1, out_ext=None, verbose=False)

Slice large images in a directory into smaller windows. If output_dir is given, export sliced images and the COCO file.

Parameters:
    coco_annotation_file_path (str): Location of the coco annotation file. (required)
    image_dir (str): Base directory for the images. (required)
    output_coco_annotation_file_name (str): File name of the exported coco dataset json. (required)
    output_dir (str, optional): Output directory. Default None.
    ignore_negative_samples (bool, optional): If True, images without annotations are ignored. Defaults to False.
    slice_height (int, optional): Height of each slice. Default 512.
    slice_width (int, optional): Width of each slice. Default 512.
    overlap_height_ratio (float, optional): Fractional overlap in height of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels). Default 0.2.
    overlap_width_ratio (float, optional): Fractional overlap in width of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels). Default 0.2.
    min_area_ratio (float, optional): If the cropped annotation area to original annotation area ratio is smaller than this value, the annotation is filtered out. Default 0.1.
    out_ext (str, optional): Extension of saved images. Default is the original suffix.
    verbose (bool, optional): Switch to print relevant values to screen. Default False.

Returns:
    coco_dict (dict): COCO dict for sliced images and annotations.
    save_path (str or Path): Path to the saved coco file.

Source code in sahi/slicing.py
def slice_coco(
    coco_annotation_file_path: str,
    image_dir: str,
    output_coco_annotation_file_name: str,
    output_dir: Optional[str] = None,
    ignore_negative_samples: Optional[bool] = False,
    slice_height: Optional[int] = 512,
    slice_width: Optional[int] = 512,
    overlap_height_ratio: Optional[float] = 0.2,
    overlap_width_ratio: Optional[float] = 0.2,
    min_area_ratio: Optional[float] = 0.1,
    out_ext: Optional[str] = None,
    verbose: Optional[bool] = False,
) -> Tuple[Dict, Union[str, Path]]:
    """
    Slice large images in a directory into smaller windows. If output_dir is given, export sliced images and the COCO file.

    Args:
        coco_annotation_file_path (str): Location of the coco annotation file
        image_dir (str): Base directory for the images
        output_coco_annotation_file_name (str): File name of the exported coco
            dataset json.
        output_dir (str, optional): Output directory
        ignore_negative_samples (bool, optional): If True, images without annotations
            are ignored. Defaults to False.
        slice_height (int, optional): Height of each slice. Default 512.
        slice_width (int, optional): Width of each slice. Default 512.
        overlap_height_ratio (float, optional): Fractional overlap in height of each
            slice (e.g. an overlap of 0.2 for a slice of size 100 yields an
            overlap of 20 pixels). Default 0.2.
        overlap_width_ratio (float, optional): Fractional overlap in width of each
            slice (e.g. an overlap of 0.2 for a slice of size 100 yields an
            overlap of 20 pixels). Default 0.2.
        min_area_ratio (float): If the cropped annotation area to original annotation
            ratio is smaller than this value, the annotation is filtered out. Default 0.1.
        out_ext (str, optional): Extension of saved images. Default is the
            original suffix.
        verbose (bool, optional): Switch to print relevant values to screen.
            Default 'False'.

    Returns:
        coco_dict: dict
            COCO dict for sliced images and annotations
        save_path: str
            Path to the saved coco file
    """

    # read coco file
    coco_dict: Dict = load_json(coco_annotation_file_path)
    # create image_id_to_annotation_list mapping
    coco = Coco.from_coco_dict_or_path(coco_dict)
    # init sliced coco_utils.CocoImage list
    sliced_coco_images: List = []

    # iterate over images and slice
    for idx, coco_image in enumerate(tqdm(coco.images)):
        # get image path
        image_path: str = os.path.join(image_dir, coco_image.file_name)
        # get annotation json list corresponding to selected coco image
        # slice image
        try:
            slice_image_result = slice_image(
                image=image_path,
                coco_annotation_list=coco_image.annotations,
                output_file_name=f"{Path(coco_image.file_name).stem}_{idx}",
                output_dir=output_dir,
                slice_height=slice_height,
                slice_width=slice_width,
                overlap_height_ratio=overlap_height_ratio,
                overlap_width_ratio=overlap_width_ratio,
                min_area_ratio=min_area_ratio,
                out_ext=out_ext,
                verbose=verbose,
            )
            # append slice outputs
            sliced_coco_images.extend(slice_image_result.coco_images)
        except TopologicalError:
            logger.warning(f"Invalid annotation found, skipping this image: {image_path}")

    # create and save coco dict
    coco_dict = create_coco_dict(
        sliced_coco_images, coco_dict["categories"], ignore_negative_samples=ignore_negative_samples
    )
    save_path = ""
    if output_coco_annotation_file_name and output_dir:
        save_path = Path(output_dir) / (output_coco_annotation_file_name + "_coco.json")
        save_json(coco_dict, save_path)

    return coco_dict, save_path

slice_image(image, coco_annotation_list=None, output_file_name=None, output_dir=None, slice_height=None, slice_width=None, overlap_height_ratio=0.2, overlap_width_ratio=0.2, auto_slice_resolution=True, min_area_ratio=0.1, out_ext=None, verbose=False)

Slice a large image into smaller windows. If output_file_name and output_dir are given, export sliced images.

Parameters:
    image (str or PIL.Image): File path of image or Pillow Image to be sliced. (required)
    coco_annotation_list (List[CocoAnnotation], optional): List of CocoAnnotation objects. Default None.
    output_file_name (str, optional): Root name of output files (coordinates will be appended to this). Default None.
    output_dir (str, optional): Output directory. Default None.
    slice_height (int, optional): Height of each slice. Default None.
    slice_width (int, optional): Width of each slice. Default None.
    overlap_height_ratio (float, optional): Fractional overlap in height of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels). Default 0.2.
    overlap_width_ratio (float, optional): Fractional overlap in width of each slice (e.g. an overlap of 0.2 for a slice of size 100 yields an overlap of 20 pixels). Default 0.2.
    auto_slice_resolution (bool, optional): If slice parameters (slice_height, slice_width) are not provided, automatically calculate them from the image resolution and orientation. Default True.
    min_area_ratio (float, optional): If the cropped annotation area to original annotation area ratio is smaller than this value, the annotation is filtered out. Default 0.1.
    out_ext (str, optional): Extension of saved images. Default is the original suffix for lossless image formats and ".png" for lossy formats (".jpg", ".jpeg").
    verbose (bool, optional): Switch to print relevant values to screen. Default False.

Returns:
    sliced_image_result (SliceImageResult):
        sliced_image_list: list of SlicedImage
        image_dir (str): Directory of the sliced image exports.
        original_image_size (list of int): Size of the unsliced original image in [height, width].

Source code in sahi/slicing.py
def slice_image(
    image: Union[str, Image.Image],
    coco_annotation_list: Optional[List[CocoAnnotation]] = None,
    output_file_name: Optional[str] = None,
    output_dir: Optional[str] = None,
    slice_height: Optional[int] = None,
    slice_width: Optional[int] = None,
    overlap_height_ratio: Optional[float] = 0.2,
    overlap_width_ratio: Optional[float] = 0.2,
    auto_slice_resolution: Optional[bool] = True,
    min_area_ratio: Optional[float] = 0.1,
    out_ext: Optional[str] = None,
    verbose: Optional[bool] = False,
) -> SliceImageResult:
    """Slice a large image into smaller windows. If output_file_name and output_dir is given, export
    sliced images.

    Args:
        image (str or PIL.Image): File path of image or Pillow Image to be sliced.
        coco_annotation_list (List[CocoAnnotation], optional): List of CocoAnnotation objects.
        output_file_name (str, optional): Root name of output files (coordinates will
            be appended to this)
        output_dir (str, optional): Output directory
        slice_height (int, optional): Height of each slice. Default None.
        slice_width (int, optional): Width of each slice. Default None.
        overlap_height_ratio (float, optional): Fractional overlap in height of each
            slice (e.g. an overlap of 0.2 for a slice of size 100 yields an
            overlap of 20 pixels). Default 0.2.
        overlap_width_ratio (float, optional): Fractional overlap in width of each
            slice (e.g. an overlap of 0.2 for a slice of size 100 yields an
            overlap of 20 pixels). Default 0.2.
        auto_slice_resolution (bool, optional): If slice parameters (slice_height, slice_width)
            are not provided, automatically calculate them from the image resolution and orientation.
        min_area_ratio (float, optional): If the cropped annotation area to original annotation
            ratio is smaller than this value, the annotation is filtered out. Default 0.1.
        out_ext (str, optional): Extension of saved images. Default is the
            original suffix for lossless image formats and png for lossy formats ('.jpg','.jpeg').
        verbose (bool, optional): Switch to print relevant values to screen.
            Default 'False'.

    Returns:
        sliced_image_result: SliceImageResult:
                                sliced_image_list: list of SlicedImage
                                image_dir: str
                                    Directory of the sliced image exports.
                                original_image_size: list of int
                                    Size of the unsliced original image in [height, width]
    """

    # define verboseprint
    verboselog = logger.info if verbose else lambda *a, **k: None

    def _export_single_slice(image: np.ndarray, output_dir: str, slice_file_name: str):
        image_pil = read_image_as_pil(image)
        slice_file_path = str(Path(output_dir) / slice_file_name)
        # export sliced image
        image_pil.save(slice_file_path)
        image_pil.close()  # to fix https://github.com/obss/sahi/issues/565
        verboselog("sliced image path: " + slice_file_path)

    # create outdir if not present
    if output_dir is not None:
        Path(output_dir).mkdir(parents=True, exist_ok=True)

    # read image
    image_pil = read_image_as_pil(image)
    verboselog("image.shape: " + str(image_pil.size))

    image_width, image_height = image_pil.size
    if not (image_width != 0 and image_height != 0):
        raise RuntimeError(f"invalid image size: {image_pil.size} for 'slice_image'.")
    slice_bboxes = get_slice_bboxes(
        image_height=image_height,
        image_width=image_width,
        auto_slice_resolution=auto_slice_resolution,
        slice_height=slice_height,
        slice_width=slice_width,
        overlap_height_ratio=overlap_height_ratio,
        overlap_width_ratio=overlap_width_ratio,
    )

    n_ims = 0

    # init images and annotations lists
    sliced_image_result = SliceImageResult(original_image_size=[image_height, image_width], image_dir=output_dir)

    image_pil_arr = np.asarray(image_pil)
    # iterate over slices
    for slice_bbox in slice_bboxes:
        n_ims += 1

        # extract image
        tlx = slice_bbox[0]
        tly = slice_bbox[1]
        brx = slice_bbox[2]
        bry = slice_bbox[3]
        image_pil_slice = image_pil_arr[tly:bry, tlx:brx]

        # set image file suffixes
        slice_suffixes = "_".join(map(str, slice_bbox))
        if out_ext:
            suffix = out_ext
        elif hasattr(image_pil, "filename"):
            suffix = Path(getattr(image_pil, "filename")).suffix
            if suffix in IMAGE_EXTENSIONS_LOSSY:
                suffix = ".png"
            elif suffix in IMAGE_EXTENSIONS_LOSSLESS:
                suffix = Path(image_pil.filename).suffix
        else:
            suffix = ".png"

        # set image file name and path
        slice_file_name = f"{output_file_name}_{slice_suffixes}{suffix}"

        # create coco image
        slice_width = slice_bbox[2] - slice_bbox[0]
        slice_height = slice_bbox[3] - slice_bbox[1]
        coco_image = CocoImage(file_name=slice_file_name, height=slice_height, width=slice_width)

        # append coco annotations (if present) to coco image
        if coco_annotation_list is not None:
            for sliced_coco_annotation in process_coco_annotations(coco_annotation_list, slice_bbox, min_area_ratio):
                coco_image.add_annotation(sliced_coco_annotation)

        # create sliced image and append to sliced_image_result
        sliced_image = SlicedImage(
            image=image_pil_slice, coco_image=coco_image, starting_pixel=[slice_bbox[0], slice_bbox[1]]
        )
        sliced_image_result.add_sliced_image(sliced_image)

    # export slices if output directory is provided
    if output_file_name and output_dir:
        conc_exec = concurrent.futures.ThreadPoolExecutor(max_workers=MAX_WORKERS)
        conc_exec.map(
            _export_single_slice,
            sliced_image_result.images,
            [output_dir] * len(sliced_image_result),
            sliced_image_result.filenames,
        )

    verboselog(
        "Num slices: " + str(n_ims) + " slice_height: " + str(slice_height) + " slice_width: " + str(slice_width)
    )

    return sliced_image_result

Slicing Utilities

  • Slice an image:
from sahi.slicing import slice_image

slice_image_result = slice_image(
    image=image_path,
    output_file_name=output_file_name,
    output_dir=output_dir,
    slice_height=256,
    slice_width=256,
    overlap_height_ratio=0.2,
    overlap_width_ratio=0.2,
)
  • Slice a COCO formatted dataset:
from sahi.slicing import slice_coco

coco_dict, coco_path = slice_coco(
    coco_annotation_file_path=coco_annotation_file_path,
    image_dir=image_dir,
    slice_height=256,
    slice_width=256,
    overlap_height_ratio=0.2,
    overlap_width_ratio=0.2,
)

Interactive Demo

Want to experiment with different slicing parameters and see their effects? Check out our interactive Jupyter notebook that demonstrates these slicing operations in action.